flowchart TB
    %% Node declarations, listed in the order they first appear in the links below.
    A[Corpus of documents]
    B[Document-feature matrix<br>'Bag of Words']
    C[Supervised<br>known categories]
    D[Unsupervised<br>unknown categories]
    E[Dictionary &<br>Sentiment]
    F[Wordscores &<br>Classifiers]
    G[Topic Models]
    H[Wordfish]
    I[Word Embeddings<br>Word2Vec, GloVe]
    J[Transformers<br>Attention mechanism]
    K[Large Language<br>Models]

    %% Solid links: corpus -> document-feature matrix -> supervised / unsupervised branches.
    A --> B
    B --> C
    B --> D
    C --> E
    C --> F
    D --> G
    D --> H
    B --> I

    %% Dotted links: word embeddings -> transformers -> large language models.
    I -.-> J
    J -.-> K

    %% Two shared node styles replace the per-node style lines.
    %% blueNode: fill #b8d4e8; yellowNode: fill #f0e68c; both use a #333 stroke.
    classDef blueNode fill:#b8d4e8,stroke:#333
    classDef yellowNode fill:#f0e68c,stroke:#333

    %% J and K (the targets of the dotted links) get the yellow fill; every other node is blue.
    class A,B,C,D,E,F,G,H,I blueNode
    class J,K yellowNode

