1
0
mirror of https://github.com/fhamborg/news-please.git synced 2021-09-19 22:26:00 +03:00
Files
news-please-content-crawler/newsplease/api/server.py
2017-02-06 12:35:24 +01:00

38 lines
911 B
Python

from extractor.document import Document
from extractor.five_w_extractor import FiveWExtractor
from flask import Flask, request, jsonify
import logging
# Flask application object; the request handler below is registered on it
# through @app.route.
app = Flask(__name__)
log = logging.getLogger(__name__)

# Server settings read by run() and handed to app.run().
# host=None defers to Flask's own default bind address.
host = None
port = 5001
debug = False
# NOTE(review): `options` is not referenced anywhere in the visible part of
# this file - confirm whether external code sets or reads it.
options = None

# One extractor instance is created at import time and shared by all requests.
extractor = FiveWExtractor()

# Attach a stream handler (stderr by default) and open both the handler and
# this module's logger to DEBUG so the debug messages from the handler show up.
ch = logging.StreamHandler()
ch.setLevel(logging.DEBUG)
log.addHandler(ch)
log.setLevel(logging.DEBUG)
def run():
    """Serve the Flask app using the module-level ``host``, ``port`` and ``debug``.

    Logs one message before handing control to Flask's built-in server and
    another once ``app.run`` returns.
    """
    log.info("starting server on port %i", port)
    app.run(host=host, port=port, debug=debug)
    log.info("server has stopped")
@app.route('/crawl', methods=['GET', 'POST'])
def extract():
    """Run the shared extractor on a JSON-encoded article.

    The request body must be a JSON object containing the keys ``title``,
    ``description`` and ``text``; their values are passed to ``Document``
    in that order.

    Returns:
        ``document.questions`` serialized with ``jsonify`` on success.
        If the body is missing, is not valid JSON, is not a JSON object, or
        lacks a required key, a JSON object with an ``error`` message and
        HTTP status 400 is returned instead of failing with a 500.
    """
    # silent=True makes get_json return None for a missing or unparsable
    # body, so every kind of bad payload is handled by the checks below.
    json_article = request.get_json(silent=True)
    if not isinstance(json_article, dict):
        return jsonify(error="request body must be a JSON object"), 400

    required = ('title', 'description', 'text')
    missing = [key for key in required if key not in json_article]
    if missing:
        return jsonify(error="missing required field(s): " + ", ".join(missing)), 400

    log.debug("retrieved raw article for extraction: %s", json_article['title'])
    document = Document(
        json_article['title'],
        json_article['description'],
        json_article['text'],
    )
    # parse() is expected to populate document.questions - the visible code
    # only shows that the attribute is read right after this call.
    extractor.parse(document)
    return jsonify(document.questions)
# Start the server only when this file is executed as a script; importing the
# module just builds `app` and the shared extractor without serving.
if __name__ == "__main__":
    run()