Commit 9e8d051b authored by Vasyl Bodnaruk

Add functionality for taking data from the DB

parent 7b68057f
# -*- coding: utf-8 -*-
import scrapy
import dateparser
from scrapy.utils.project import get_project_settings
from ..helpers import CompanyMaker, Database
from ..items import ExaItem
# Look up the 'DB' entry of the Scrapy project settings; it is unpacked below as
# keyword arguments for Database (presumably connection parameters -- confirm
# against the project's settings module).
# NOTE(review): if the 'DB' setting is absent, .get() presumably yields None and
# the ** unpacking below fails at import time -- confirm this is acceptable.
db_settings = get_project_settings().get('DB')
# Module-level Database handle, created once at import time; the spider's
# start_requests() uses it to run its SELECT query.
db = Database(**db_settings)
class AitopSpider(scrapy.Spider):
name = "aitop"
allowed_domains = ["aitopics.org"]
start_urls = ['https://aitopics.org/search?view=&filters=&sort=score+desc&q=x.ai']
def __init__(self, *args, **kwargs):
    """Prepare the SQL used to pick the entities this spider will crawl.

    The base query selects ``id``, ``name`` and ``country`` from
    ``wp_esi_entity`` for the entity with ``id=13``. When the spider is
    started with a ``query`` keyword argument (e.g. ``-a query=...``), that
    text is appended to the WHERE clause as an additional ``or`` condition.

    Args:
        *args: Positional arguments, forwarded to ``scrapy.Spider.__init__``.
        **kwargs: Spider arguments, forwarded to ``scrapy.Spider.__init__``.
            ``query`` (optional) is a raw SQL condition fragment.
    """
    # Initialise the base spider first and pass the arguments through, as
    # Scrapy's spider-argument convention expects. The base initialiser
    # copies keyword arguments onto the instance (including ``query``), so
    # it must run before ``self.query`` is assigned below.
    super(AitopSpider, self).__init__(*args, **kwargs)

    self.condition = kwargs.get('query')
    self.query = "SELECT id, name, country FROM wp_esi_entity WHERE 1 and id=13"
    if self.condition:
        self.logger.debug('Extra entity condition: %s', self.condition)
        # NOTE(security): the condition is spliced into the SQL verbatim.
        # It is an arbitrary WHERE fragment and cannot be parameterised, so
        # it must only ever come from a trusted operator, never from
        # untrusted input.
        self.query += ' or {}'.format(self.condition)
def start_requests(self):
    """Yield one initial request per company loaded from the database.

    Runs ``self.query`` through the module-level ``db`` handle, wraps the
    result in a ``CompanyMaker`` and asks it to build the companies for this
    spider's ``name``. For every company returned, a request for the
    company's ``url`` plus a trailing ``/`` is issued with ``self.parse`` as
    callback; the company object and a ``post_id`` of 0 travel in ``meta``.

    Companies for which the request cannot be constructed are skipped, and
    the failure is logged instead of being dropped silently.

    Yields:
        scrapy.Request: the start request for each usable company.
    """
    companies = CompanyMaker(db.select(self.query))
    companies.make_companies(self.name)
    for company in companies.get_companies():
        try:
            request = scrapy.Request(
                company.url + '/',
                callback=self.parse,
                meta={'company': company, 'post_id': 0},
            )
        except Exception:
            # Deliberately best-effort: one bad record must not abort the
            # whole crawl, but the skip is now visible in the log.
            self.logger.warning(
                'Skipping company %r: could not build start request',
                company,
                exc_info=True,
            )
            continue
        # Yield outside the try block so that GeneratorExit (and anything
        # thrown into the generator) is never swallowed by the handler.
        yield request
def parse(self, response):
name = 'Uber'
url = 'https://aitopics.org'
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment