flashbot/words_db.py at main · jbenbee/flashbot · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
import threading

import numpy as np
import pandas as pd


class WordsDB:
    """In-memory table of words loaded from a CSV file, guarded by a lock.

    The table is kept in ``self.words_df`` (a pandas DataFrame). The methods
    below use the columns ``id``, ``word``, ``lang`` and ``tags``. Every
    method that touches the table holds ``self._lock`` for the duration of
    the access; the lock is taken with a ``with`` statement so it is always
    released, even when the guarded operation raises.
    """

    def __init__(self, db_path):
        """Load the words table from the CSV file at *db_path*.

        Raises:
            ValueError: if the ``id`` column contains duplicate values.
        """
        self.db_path = db_path
        self.words_df = pd.read_csv(self.db_path)
        self.words_df['id'] = self.words_df['id'].astype(int)
        if not self.words_df['id'].is_unique:
            raise ValueError('"id" field in the words database is not unique.')
        self._lock = threading.Lock()

    def save_words_db(self):
        """Write the current table back to ``self.db_path`` as CSV (no index column)."""
        # ``with`` guarantees the lock is released if ``to_csv`` fails
        # (e.g. unwritable path); a bare acquire/release pair would leave the
        # lock held and block every later call.
        with self._lock:
            self.words_df.to_csv(self.db_path, index=False)

    def get_words_df(self):
        """Return a copy of the whole table, so callers cannot mutate shared state."""
        with self._lock:
            return self.words_df.copy()

    def get_word_data(self, word, lang):
        """Return the rows matching *word* and *lang* as ``DataFrame.to_dict()`` output.

        The result maps each column name to a ``{row_index: value}`` dict; the
        inner dicts are empty when nothing matches.
        """
        with self._lock:
            is_match = (self.words_df['word'] == word) & (self.words_df['lang'] == lang)
            return self.words_df.loc[is_match].to_dict()

    def add_new_word(self, word, lang):
        """Return the id of (*word*, *lang*), inserting a new row if it is absent.

        A new row gets ``id = max(existing ids) + 1`` and ``tags = NaN``. When
        the table has no ids yet, numbering starts at 0.

        Raises:
            ValueError: if the (*word*, *lang*) pair occurs more than once.
        """
        with self._lock:
            is_match = (self.words_df['lang'] == lang) & (self.words_df['word'] == word)
            word_data = self.words_df.loc[is_match]
            n_matches = word_data.shape[0]

            if n_matches > 1:
                raise ValueError(f'The same word "{word}" appears >1 time in the database: {word_data}')
            if n_matches == 1:
                return int(word_data['id'].item())

            # ``max()`` of an empty column is NaN, and ``int(NaN)`` raises;
            # fall back to 0 as the first id in that case.
            max_id = self.words_df['id'].max()
            word_id = 0 if pd.isna(max_id) else int(max_id) + 1
            self.words_df.loc[len(self.words_df)] = {'id': word_id, 'word': word,
                                                     'lang': lang, 'tags': np.nan}
            return word_id

    def release_lock(self):
        """Release the internal lock if it is currently held.

        Kept for backward compatibility. The methods of this class release the
        lock themselves on every exit path, so this is only a recovery hatch.
        NOTE: ``threading.Lock`` has no owner, so this releases the lock even
        if a different thread is the one holding it.
        """
        if self._lock.locked():
            self._lock.release()