feat: rewrite pseudonym generator in Rust
This commit is contained in:
33
download_data.py
Normal file
33
download_data.py
Normal file
@@ -0,0 +1,33 @@
|
||||
import nltk
|
||||
import os
|
||||
|
||||
def _collect_words():
    """Return ``(adjectives, nouns)`` as sorted lists of capitalized lemmas.

    Only purely alphabetic lemma names are kept, which drops multi-word
    entries (WordNet joins them with ``_``) as well as hyphenated and
    numeric ones.
    """
    adjectives = set()
    nouns = set()
    for synset in nltk.corpus.wordnet.all_synsets():
        pos = synset.pos()
        # WordNet tags adjective "satellite" synsets as 's' rather than 'a';
        # both are adjectives, so accept either tag.
        if pos in ('a', 's'):
            bucket = adjectives
        elif pos == 'n':
            bucket = nouns
        else:
            continue
        for lemma in synset.lemmas():
            name = lemma.name()
            if name.isalpha():
                # Capitalize *before* inserting so that lemmas differing only
                # in case ("china" / "China") collapse into a single entry.
                bucket.add(name.capitalize())
    # Sets iterate in a hash-dependent order that changes between runs;
    # sorting makes the generated files reproducible.
    return sorted(adjectives), sorted(nouns)


def _write_word_list(path, words):
    """Write *words* to *path*, one word per line, encoded as UTF-8."""
    # An explicit encoding keeps the output independent of the platform's
    # default locale encoding.
    with open(path, 'w', encoding='utf-8') as file:
        file.writelines(word + '\n' for word in words)


def main():
    """Download the NLTK corpora and generate the adjective/noun word lists.

    Writes ``data/adjectives.txt`` and ``data/nouns.txt`` relative to the
    current working directory, creating ``data`` if necessary. Each file
    holds one capitalized word per line, sorted and without duplicates.
    """
    # Load the corpora
    nltk.download('wordnet')
    # NOTE(review): the two resources below are not used anywhere in this
    # script; they are kept in case another tool relies on them -- confirm.
    nltk.download('averaged_perceptron_tagger')
    nltk.download('universal_tagset')

    # Get all the adjectives and nouns
    adjectives, nouns = _collect_words()

    # Create the output directory if it doesn't exist
    os.makedirs('data', exist_ok=True)

    _write_word_list(os.path.join('data', 'adjectives.txt'), adjectives)
    _write_word_list(os.path.join('data', 'nouns.txt'), nouns)
|
||||
|
||||
# Generate the word lists only when run as a script, not when imported.
if __name__ == "__main__":
    main()
|
||||
Reference in New Issue
Block a user