This commit is contained in:
Alexander Popov 2021-02-22 19:36:51 +03:00
parent 05c12b3977
commit a3fa54e67d
6 changed files with 64 additions and 66 deletions

5
.gitignore vendored
View File

@ -1,3 +1,2 @@
.venv/
*~
venv/
words.db

2
CHANGELOG.md Normal file
View File

@ -0,0 +1,2 @@
# 1.0.0 (2021-02-22)
+ Release version

View File

@ -1,6 +1,6 @@
MIT License
Copyright (c) 2020 Alexander Popov
Copyright (c) 2021 Alexander Popov
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal

59
grab.py Executable file
View File

@ -0,0 +1,59 @@
#!/usr/bin/env python3
from time import sleep
import sqlite3
import requests
from bs4 import BeautifulSoup
__author__ = 'Alexander Popov'
__license__ = 'MIT'
__version__ = '1.0.0'
__email__ = 'iiiypuk@fastmail.fm'
def parse():
r = requests.get('https://randomword.com/')
data = r.text
soup = BeautifulSoup(data, 'html.parser')
word = soup.find('div', {'id': 'random_word'}).text
word_definition = soup.find('div', {'id': 'random_word_definition'}).text
new_word = {'word': word, 'definition':
word_definition.replace(' ', '')}
return(new_word)
if __name__ == '__main__':
# dict for new parsed words
words = {}
# open datebase
db = sqlite3.connect('./words.db')
cursor = db.cursor()
# create new table if not exist
try:
cursor.execute('CREATE TABLE words(word text, definition text)')
except sqlite3.OperationalError as e:
print('INFO:', e)
# start parse words
try:
while(True):
sleep(0.5)
new_word = parse()
words[new_word['word']] = new_word['definition']
print('Parsed', new_word['word'])
except KeyboardInterrupt:
for word in words:
cursor.execute(
'INSERT INTO words VALUES ("{word}", "{defin}")'
.format(word=word, defin=words[word]))
db.commit()
print('Saved %d words.' % len(words))

View File

@ -1,58 +0,0 @@
#!/usr/bin/env python3
from bs4 import BeautifulSoup
import requests
import json
from time import sleep
def load_words():
with open('./words.json', encoding='utf-8') as file:
words = json.load(file, encoding='utf-8')
return(words)
def parse():
r = requests.get('https://randomword.com/')
data = r.text
soup = BeautifulSoup(data, 'html.parser')
word = soup.find('div', {'id': 'random_word'}).text
word_definition = soup.find('div', {'id': 'random_word_definition'}).text
new_word = {'word': word, 'definition':
[word_definition.replace(' ', '')]}
return(new_word)
def main(words_data):
while(True):
sleep(0.5)
new_word = parse()
print(new_word)
words_data[new_word['word']] = new_word['definition']
return(words_data)
__author__ = 'Alexander Popov'
__license__ = "MIT"
__version__ = "1.0.1"
__email__ = "iiiypuk@fastmail.fm"
if __name__ == '__main__':
words = {}
words = load_words()
try:
while(True):
words = main(words)
except KeyboardInterrupt:
with open('./words.json', 'w', encoding='utf-8') as file:
file.write(
json.dumps(words, indent=4, ensure_ascii=False))
print('Saved %d words.' % len(words))

View File

@ -1,4 +0,0 @@
{
}