public_sentiment/web/controller/html_parser_controller.py
2024-09-23 08:44:54 +08:00

34 lines
1007 B
Python

#!/usr/bin/env python
# -*- coding: utf-8 -*-
from django.http import JsonResponse
from rest_framework.decorators import api_view
from rest_framework.views import APIView
from web.controller.base_controller import BaseController
from web.manager.log_manager import LogManager
from web.util.dto_util import DtoUtil
from web.vo.parse_html_vo import ParseHtmlVo
# Module-level logger obtained from the project's LogManager, keyed by this
# module's name; used by the controller below for request tracing.
Logger = LogManager.get_logger(__name__)
class HtmlParserController(APIView, BaseController):
    """Controller exposing the HTML parsing endpoint over HTTP."""

    # NOTE(review): ``api_view`` is documented for function-based views;
    # confirm that decorating a method of an ``APIView`` subclass is routed
    # and invoked as intended by the URL configuration.
    @api_view(['POST'])
    def parse_html(self, request):
        """
        Parse the HTML located at the URL supplied in the request.

        The request is converted into a ``ParseHtmlVo`` through
        ``self.to_vo``; its ``url`` attribute is handed to
        ``self.html_parser_handler.parse_html`` (presumably provided by
        ``BaseController`` -- verify). The service result is converted with
        ``DtoUtil.service_result_to_api_result`` and returned as JSON.

        :param request: incoming HTTP request carrying the parse parameters
        :return: ``JsonResponse`` wrapping the converted service result
        """
        Logger.info("开始解析html")

        vo = self.to_vo(request, ParseHtmlVo)
        outcome = self.html_parser_handler.parse_html(vo.url)

        # safe=False lets JsonResponse serialize non-dict payloads as well.
        api_payload = DtoUtil.service_result_to_api_result(outcome)
        return JsonResponse(api_payload, safe=False)