123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209 |
- # -*- encoding: utf-8 -*-
- #
- import os, json, sys, subprocess, urllib.parse, traceback
- import random, time, datetime, re
- from urllib.parse import unquote
- virtual_env = os.path.expanduser('~/projects/world-it-planet/env')
- activate_this = os.path.join(virtual_env, 'bin/activate_this.py')
- exec(open(activate_this).read(), dict(__file__=activate_this))
- import requests
- #MySql
- from mysql.connector import connect, Error
- #декларативное определение SQLLite
- from sqlalchemy import Column, Integer, String, create_engine
- from sqlalchemy.ext.declarative import declarative_base
- from sqlalchemy.orm import sessionmaker
- from sqlalchemy import desc
- #---------------------------------- Variables ----------
- #---------------------------------- Variables End ----------
- def application(env, start_response):
- out_s = {}
- """
- for key in env:
- out_s = out_s + str(key) + "=" + str(env[key]) + "<br>"
- """
- #получаем $_GET из запроса
- get_query = env['QUERY_STRING']
- get_json = get_query.replace("q=", "")
- get_json = unquote(get_json)
- get_dict = json.loads(get_json)
- tm_id = str(get_dict['tm_id'])
- out_s["tm_id"] = tm_id
-
- #Инициализация MySQL
- mysql_connection = connect(
- host="localhost",
- user="id35114350",
- password="Hgatrdy5rTeq",
- database="id35114350_steelfeet",
- charset='utf8',
- use_unicode=True
- )
- #Инициализация SQLLite
- basedir = os.path.abspath(os.path.dirname(__file__))
- SQLALCHEMY_DATABASE_URI = 'sqlite:///' + os.path.join(basedir, 'hhtm.db')
- engine = create_engine(SQLALCHEMY_DATABASE_URI, pool_pre_ping=True)
- Base = declarative_base()
- class Vacancies(Base):
- __tablename__ = 'vacancies'
- id = Column(Integer, primary_key=True, autoincrement=True)
- title = Column(String(512))
- city = Column(String(20))
- specialization = Column(String(255))
- href = Column(String(512))
- donor = Column(String(255))
- vacancy_id = Column(Integer)
- vacancy_date = Column(Integer)
- parse_date = Column(Integer)
- employer = Column(String(255))
- canal_city_id = Column(Integer)
- canal_city_date = Column(Integer)
- canal_spec_id = Column(Integer)
- canal_spec_date = Column(Integer)
- def __init__(self, title, city, specialization, href, donor, vacancy_id, vacancy_date, parse_date, employer, canal_city_id, canal_city_date, canal_spec_id, canal_spec_date):
- self.title = title
- self.city = city
- self.specialization = specialization
- self.href = href
- self.donor = donor
- self.vacancy_id = vacancy_id
- self.vacancy_date = vacancy_date
- self.parse_date = parse_date
- self.employer = employer
- self.canal_city_id = canal_city_id
- self.canal_city_date = canal_city_date
- self.canal_spec_id = canal_spec_id
- self.canal_spec_date = canal_spec_date
- def __repr__(self):
- return "<Vacancy('%s','%s', '%s')>" % (self.title, self.specialization, self.href)
- Session = sessionmaker(bind=engine)
- sqllite_session = Session()
- #------------------------------------------ Основной цикл ------------------
- #запрос wp_id по внешнему сервису
- params = {
- "action":"show_wp_id",
- "tm_id":tm_id
- }
- params_json = json.dumps(params)
- get_wp_url = "https://steelfeet.ru/app/get.php?q=" + params_json
- out_s["get_wp_url"] = get_wp_url
- response = requests.get(get_wp_url)
- wp_id = int(response.text)
- out_s["wp_id"] = wp_id
- now = datetime.datetime.now()
- #просто последние пять спарсенных
- #vacancies = sqllite_session.query(Vacancies).order_by(desc(Vacancies.parse_date))[0:5]
- #отбираем показанные вакансии
- showed_vacancies_query = "SELECT `data_1`, `data_3`, `weight` FROM `sf_log` WHERE (`code` = 'vacancy') AND (`action` = 'show_next') AND (`user_id` = " + str(wp_id) + ");"
- #out_s["showed_vacancies_query"] = showed_vacancies_query
- with mysql_connection.cursor(buffered=True) as cursor:
- cursor.execute(showed_vacancies_query)
- showed_vacancies = cursor.fetchall()
- showed_vacancies_ids = []
- for item in showed_vacancies:
- item_id, item_data_3, item_weight = item
- showed_vacancies_ids.append(item_id)
- #считаем статистику слов
- #отбираем все вакансии
- all_vacancies_query = "SELECT `data_1`, `data_3`, `weight` FROM `sf_log` WHERE (`code` = 'vacancy') AND (`user_id` = " + str(wp_id) + ");"
- with mysql_connection.cursor(buffered=True) as cursor:
- cursor.execute(all_vacancies_query)
- all_vacancies = cursor.fetchall()
- words_stat = {}
- for item in all_vacancies:
- item_id, item_data_3, item_weight = item
-
- words = str(item_data_3).replace('-',' ').replace('/',' ').replace('\\',' ').replace('(','').replace(')','').split(" ")
- for word in words:
- try:
- if (len(word) > 0):
- words_stat[word] = words_stat[word] + item_weight
- except:
- words_stat[word] = item_weight
- out_s["words"] = words_stat
-
- #считаем веса для непоказанных вакансий
- vacancies = sqllite_session.query(Vacancies).order_by(desc(Vacancies.parse_date))[0:500]
-
- vacancies_list = []
- for item in vacancies:
- #непоказанные
- if (not(item.id in showed_vacancies_ids)):
- words = str(item.title).replace('-',' ').replace('/',' ').replace('\\',' ').replace('(','').replace(')','').split(" ")
- vacancy_weight = 0
- for word in words:
- try:
- if (len(word) > 0):
- vacancy_weight = vacancy_weight + words_stat[word]
- except:
- pass
-
- vacancy_item = {
- "id" : item.id,
- "weight" : vacancy_weight,
- "title" : str(item.title),
- "href" : item.href,
- }
- vacancies_list.append(vacancy_item)
- #сортируем по весу
- vacancies_list = sorted(vacancies_list, key=lambda x: x["weight"], reverse=True)
- #выводим лучшие 5
- vacancies_list = vacancies_list[0:5]
- for item in vacancies_list:
- #добавляем показанные вакансии в лог
- #INSERT INTO `sf_log` (`user_id`, `date`, `hour`, `action`, `data_1`, `data_2`, `data_3`, `data_4`, `data`, `weight`) VALUES ('', '', '', '', '', '', '', '', '', '');
- exist_vacancies_query = "SELECT `id` FROM `sf_log` WHERE (`code` = 'vacancy') AND (`data_1` = " + str(item["id"]) + ");"
- with mysql_connection.cursor(buffered=True) as cursor:
- cursor.execute(exist_vacancies_query)
- exist_vacancies = cursor.fetchall()
- if (len(exist_vacancies) == 0):
- mysql_query = "INSERT INTO `sf_log` (`user_id`, `date`, `hour`, `code`, `action`, `data_1`, `data_2`, `data_3`, `data_4`, `data`, `weight`) VALUES ('" + str(wp_id) + "', '" + str(int(time.time())) + "', '" + str(now.hour) + "', 'vacancy', 'show_best', '" + str(item["id"]) + "', '', '" + str(item["title"]) + "', '', 'data_1=>vacancy_id, data_3=>vacancy_title', '');"
-
- with mysql_connection.cursor() as cursor:
- cursor.execute(mysql_query)
- mysql_connection.commit()
- out_s["vacancies"] = vacancies_list
- start_response('200 OK', [('Content-Type','text/html')])
- out_s = json.dumps(out_s)
- b = out_s.encode('utf-8')
- return [b]
|