3.2 KiB
3.2 KiB
Imported modules
In [1]:
# Standard library
import datetime
import json
import logging
import re

# Third-party PostgreSQL driver
import psycopg2
from psycopg2.extras import execute_batch

# Scraping helpers (not stdlib or psycopg2; presumably project-local)
import scrapping

# from psycopg2.extensions import register_adapter

# Route log records to a new file named after the moment this cell runs;
# filemode 'w' truncates the file if one with that name already exists.
logging.basicConfig(
    filename=datetime.datetime.now().strftime("%Y-%m-%d_%H-%M-%S.log"),
    filemode='w',
    level=logging.INFO,
    format='%(name)s - %(levelname)s - %(message)s',
    # NOTE(review): datefmt only shapes %(asctime)s, which the format string
    # above does not contain, so it currently has no visible effect.
    datefmt='%d-%b-%y %H:%M:%S',
)
In [3]:
# Bulk-load the scraped English texts of every project named in the
# ``project_list`` file into the ``raw_texts`` table, committing once per
# project. When a project's insert fails, its scraped payload is dumped as JSON
# to a file named after the project so it is not lost, and the loop moves on.
#
# NOTE(review): the database credentials are hard-coded in the DSN below;
# consider moving them out of the notebook.
conn = psycopg2.connect("dbname='dh' user='dh' host='dh.saret.tk' password='qwerty'")
connection = conn.cursor()  # NB: despite its name, this is a cursor

# Read the whole list up front so the file is not held open while scraping.
with open('project_list') as f:
    project_names = f.read().split('\n')

for project in project_names:
    # A trailing newline (or a blank line) in project_list yields an empty
    # entry; there is nothing to scrape for it.
    if not project.strip():
        continue

    # connection = connection.execute("insert into raw_texts values (%(id_text)s, %(project_name)s, %(raw_text)s)", scrap)
    scrap = scrapping.get_raw_english_texts_of_project(project)
    try:
        execute_batch(
            connection,
            "insert into raw_texts values (%(id_text)s, %(project_name)s, %(raw_text)s)",
            scrap,
        )
        conn.commit()
    except Exception as exc:
        # Save the payload first so it survives even if the rollback below fails.
        with open(project, 'w') as dump_file:
            dump_file.write(json.dumps(scrap))
        # Log the caught exception instance (plus traceback), not the
        # Exception class itself.
        logging.exception("Error in %s:%s", project, exc)
        # A failed statement leaves the transaction aborted; without a
        # rollback every later project's insert would be rejected as well.
        conn.rollback()
In [33]:
# Load a single project -- the third entry (index 2) of ``project_list`` --
# into the ``raw_texts`` table. No error handling: any failure propagates.
conn = psycopg2.connect("dbname='dh' user='dh' host='dh.saret.tk' password='qwerty'")
connection = conn.cursor()  # NB: despite its name, this is a cursor

# NOTE(review): logging.basicConfig is documented to do nothing when the root
# logger already has handlers, so if logging was configured earlier in this
# session, 'Start' goes to that earlier destination rather than ./now.log.
logging.basicConfig(
    format='%(name)s - %(levelname)s - %(message)s',
    filename='./now.log',
    level=logging.INFO,
)
logging.info('Start')

with open('project_list') as f:
    project_names = f.read().split('\n')
    project = project_names[2]

scrap = scrapping.get_raw_english_texts_of_project(project)
insert_sql = "insert into raw_texts values (%(id_text)s, %(project_name)s, %(raw_text)s)"
execute_batch(connection, insert_sql, scrap)
conn.commit()
In [44]:
In [ ]:
In [ ]: