From 9d38dfc2b26bc52fb4a5030487dd424d7c40e45d Mon Sep 17 00:00:00 2001 From: Vover Date: Fri, 11 Oct 2024 15:49:15 +0400 Subject: [PATCH 01/19] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 358fed9..50f06b0 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,2 @@ # Tokenizer -Leatning tokenization for Deep learning and LLms +Learning tokenization for Deep learning and LLms From 223c3bdd5a819205c91acd750976e62e70dc7a4f Mon Sep 17 00:00:00 2001 From: Vover Date: Sun, 13 Oct 2024 19:04:17 +0400 Subject: [PATCH 02/19] Update README.md --- README.md | 12 ++++++++++-- 1 file changed, 10 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 50f06b0..b04c1a9 100644 --- a/README.md +++ b/README.md @@ -1,2 +1,10 @@ -# Tokenizer -Learning tokenization for Deep learning and LLms +# SmolBPE + +Tokenization for Deep Learning and Large Language Models (LLMs). +## Description + +SmolBPE is a repository focused on providing efficient tokenization techniques for deep learning and large language models. This project is composed primarily of Jupyter Notebooks and Python scripts. + +## Features + +- Efficient tokenization algorithms. From d20ad44ed5c2be1cca3c0f92fc52e0a07a613ddc Mon Sep 17 00:00:00 2001 From: Vover Date: Sun, 13 Oct 2024 19:08:01 +0400 Subject: [PATCH 03/19] Update README.md --- README.md | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/README.md b/README.md index b04c1a9..30fde64 100644 --- a/README.md +++ b/README.md @@ -8,3 +8,13 @@ SmolBPE is a repository focused on providing efficient tokenization techniques f ## Features - Efficient tokenization algorithms. + +---- + +## Byte pair encoding + +Byte pair encoding (also known as digram coding) is an algorithm, first described in 1994 by Philip Gage for encoding strings of text into tabular form for use in downstream modeling. Its modification is notable as the large language model tokenizer with an ability to combine both tokens that encode single characters (including single digits or single punctuation marks) and those that encode whole words (even the longest compound words). This modification, in the first step, assumes all unique characters to be an initial set of 1-character long n-grams (i.e. initial "tokens"). Then, successively, the most frequent pair of adjacent characters is merged into a new, 2-character long n-gram and all instances of the pair are replaced by this new token. This is repeated until a vocabulary of prescribed size is obtained. Note that new words can always be constructed from final vocabulary tokens and initial-set characters. This algorithmic approach has been extended from spoken language to sign language in recent years. + +All the unique tokens found in a corpus are listed in a token vocabulary, the size of which, in the case of GPT-3.5 and GPT-4, is 100256. 
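For readers of the series, the merge procedure described in that paragraph can be made concrete with a short, self-contained sketch that is independent of the smolbpe code added in the later patches: start from raw bytes, repeatedly count adjacent pairs, and replace the most frequent pair with a fresh token id. The toy string and the helper names below are illustrative only.

```python
# Minimal byte-pair-encoding merge loop, for illustration only.
# Sequences are lists of ints, mirroring a byte-level tokenizer's 256 initial tokens.
from collections import Counter

def most_frequent_pair(ids):
    # Count adjacent pairs and return the most common one.
    return Counter(zip(ids, ids[1:])).most_common(1)[0][0]

def merge(ids, pair, new_id):
    # Replace every occurrence of `pair` with the new token id.
    out, i = [], 0
    while i < len(ids):
        if i < len(ids) - 1 and (ids[i], ids[i + 1]) == pair:
            out.append(new_id)
            i += 2
        else:
            out.append(ids[i])
            i += 1
    return out

ids = list("aaabdaaabac".encode("utf-8"))  # toy corpus (placeholder)
merges = {}
for new_id in range(256, 259):             # three merges, for illustration
    pair = most_frequent_pair(ids)
    ids = merge(ids, pair, new_id)
    merges[pair] = new_id
print(ids, merges)
```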
+ +![image](https://github.com/user-attachments/assets/27cf64e5-42a1-470b-baee-fc5a170bb4eb) From ef3ac4d832dcf571cc70da4f879365ec88298efe Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 16:34:29 +0400 Subject: [PATCH 04/19] feat: enhance GPT4Tokenizer with vocab loading/saving and CLI support --- smolbpe/gpt4.py | 89 ++++++++++++++++++++++++++++++++++++++----------- 1 file changed, 70 insertions(+), 19 deletions(-) diff --git a/smolbpe/gpt4.py b/smolbpe/gpt4.py index a1f4508..4cb8626 100644 --- a/smolbpe/gpt4.py +++ b/smolbpe/gpt4.py @@ -1,12 +1,15 @@ import regex as re +import argparse +import json class GPT4Tokenizer(): - def __init__(self): + def __init__(self, path='vocab.json', pattern=None): self.vocab = {idx : bytes([idx]) for idx in range(256)} self.merges = dict() - self.pattern = r"""'(?i:[sdmt]|ll|ve|re)|[^\r\n\p{L}\p{N}]?+\p{L}+|\p{N}{1,3}| ?[^\s\p{L}\p{N}]++[\r\n]*|\s*[\r\n]|\s+(?!\S)|\s+""" + self.pattern = pattern if pattern else r"\p{L}+|\p{Z}+|\p{N}+|[\p{P}&&[^.]]" self.splitby = re.compile(self.pattern) + self.path = path def train(self, text, vocab_size): @@ -28,20 +31,28 @@ def train(self, text, vocab_size): ids = [self.merge(chunk_ids, pair, idx) for chunk_ids in ids] self.merges[pair] = idx self.vocab[idx] = self.vocab[pair[0]] + self.vocab[pair[1]] + self.save_vocab_and_merges(self.path) + def encode(self, text): - tokens = list(text.encode("utf-8")) - while len(tokens)>=2: - bigrams = self.get_pairs(tokens) - pair = min(bigrams, key = lambda p: bigrams.get(p, float("inf"))) - if pair not in self.merges: + ids = list(text.encode('utf-8')) + + while True: + pairs = self.get_pairs(ids) + mergeable_pairs = {p: self.merges[p] for p in pairs if p in self.merges} + + + if not mergeable_pairs: break - idx = self.merges[pair] - tokens = self.merge(tokens, pair, idx) - return tokens - + pair = min(mergeable_pairs, key=self.merges.get) + + ids = self.merge(ids, pair, self.merges[pair]) + + return ids + + def decode(self, ids): tokens = b"".join(self.vocab[idx] for idx in ids) text = tokens.decode("utf-8", errors="replace") @@ -57,6 +68,41 @@ def get_pairs(self, ids, counts=None): return counts + def save_vocab_and_merges(self, path): + data = { + 'vocab': {}, + 'merges': {} + } + # Save vocab + for idx, byte_val in self.vocab.items(): + try: + data['vocab'][str(idx)] = byte_val.decode('utf-8') + except UnicodeDecodeError: + data['vocab'][str(idx)] = byte_val.hex() + # Save merges + for (first, second), idx in self.merges.items(): + key = f"{first},{second}" # Convert tuple to string + data['merges'][key] = idx + with open(path, 'w', encoding='utf-8') as f: + json.dump(data, f, indent=2) + + + def load_vocab(self, path='vocab.json'): + with open(path, 'r', encoding='utf-8') as f: + data = json.load(f) + # Load vocab + self.vocab = {} + for idx_str, value in data['vocab'].items(): + idx = idx_str + self.vocab[idx] = value.encode('utf-8') + # Load merges + self.merges = {} + for pair_str, idx in data['merges'].items(): + first_str, second_str = pair_str.split(',') + first, second = int(first_str), int(second_str) + self.merges[(first, second)] = idx + + def merge(self, ids, pair, idx): id = 0 newids = [] @@ -70,11 +116,16 @@ def merge(self, ids, pair, idx): return newids -t = GPT4Tokenizer() - -with open("./data/taylorswift.txt", "r") as f: - text = f.read() - -t.train(text, 400) -print(t.vocab) -print(t.decode(t.encode("Hello world"))) +if __name__=='__main__': + parser = argparse.ArgumentParser() + parser.add_argument('-t', '--text', type=str, help='Text to train 
tokenizer on') + parser.add_argument('-v','--vocab_size', type=int, help='Vocab size for tokenizer') + parser.add_argument('-o', '--output', default='vocab.json', type=str, help='Output path for vocab and merges') + parser.add_argument('-p', '--pattern', type=str, help='Regex pattern to split text') + args = parser.parse_args() + + with open(args.text, 'r') as f: + args.text = f.read() + + tokenizer = GPT4Tokenizer(args.output, args.pattern) + tokenizer.train(args.text, args.vocab_size) From 88a080505da18cc30e3e90bae2b6ff187dbbc32a Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 16:38:12 +0400 Subject: [PATCH 05/19] feat: initialize smolbpe module --- smolbpe/__init__.py | 0 1 file changed, 0 insertions(+), 0 deletions(-) create mode 100644 smolbpe/__init__.py diff --git a/smolbpe/__init__.py b/smolbpe/__init__.py new file mode 100644 index 0000000..e69de29 From d952b4a0be8d866e08c54987b5991d4e21763e9a Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 17:02:57 +0400 Subject: [PATCH 06/19] feat: add initial implementation of GPT-4 compatible tokenizer and setup configuration --- MANIFEST.in | 2 ++ setup.py | 29 ++++++++++++++++++++++++++ smolbpe/data/__init__.py | 0 {data => smolbpe/data}/taylorswift.txt | 0 {data => smolbpe/data}/text.py | 0 smolbpe/{gpt4.py => gpt4Tokenizer.py} | 0 tests/__init__.py | 0 7 files changed, 31 insertions(+) create mode 100644 MANIFEST.in create mode 100644 setup.py create mode 100644 smolbpe/data/__init__.py rename {data => smolbpe/data}/taylorswift.txt (100%) rename {data => smolbpe/data}/text.py (100%) rename smolbpe/{gpt4.py => gpt4Tokenizer.py} (100%) create mode 100644 tests/__init__.py diff --git a/MANIFEST.in b/MANIFEST.in new file mode 100644 index 0000000..454c748 --- /dev/null +++ b/MANIFEST.in @@ -0,0 +1,2 @@ +include smolbpe/data/*.txt +include smolbpe/data/*.json \ No newline at end of file diff --git a/setup.py b/setup.py new file mode 100644 index 0000000..3007929 --- /dev/null +++ b/setup.py @@ -0,0 +1,29 @@ +from setuptools import setup, find_packages + +setup( + name='gpt4tokenizer', + version='0.1.0', + description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', + author='Vover', + author_email='your.email@example.com', + url='https://github.com/yourusername/gpt4tokenizer', # Replace with your repository URL + packages=find_packages(include=['smolbpe', 'smolbpe.*']), + install_requires=[ + 'regex>=2021.4.4', + ], + classifiers=[ + 'Programming Language :: Python :: 3', + 'License :: OSI Approved :: MIT License', + 'Operating System :: OS Independent', + ], + python_requires='>=3.6', + include_package_data=True, + package_data={ + 'smolbpe': ['data/*.txt', 'data/*.json'], + }, + entry_points={ + 'console_scripts': [ + 'gpt4tokenizer=smolbpe.gpt4Tokenizer:main', # If you have a main function + ], + }, +) \ No newline at end of file diff --git a/smolbpe/data/__init__.py b/smolbpe/data/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/data/taylorswift.txt b/smolbpe/data/taylorswift.txt similarity index 100% rename from data/taylorswift.txt rename to smolbpe/data/taylorswift.txt diff --git a/data/text.py b/smolbpe/data/text.py similarity index 100% rename from data/text.py rename to smolbpe/data/text.py diff --git a/smolbpe/gpt4.py b/smolbpe/gpt4Tokenizer.py similarity index 100% rename from smolbpe/gpt4.py rename to smolbpe/gpt4Tokenizer.py diff --git a/tests/__init__.py b/tests/__init__.py new file mode 100644 index 0000000..e69de29 From 5c74ff8ff94ea1eec42e6ff9de80c923c493c5ce Mon Sep 17 
00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 17:15:17 +0400 Subject: [PATCH 07/19] fix: update author email and repository URL in setup.py; adjust import path in character_tokenizing.py --- setup.py | 6 +++--- tests/character_tokenizing.py | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/setup.py b/setup.py index 3007929..3d174a8 100644 --- a/setup.py +++ b/setup.py @@ -5,8 +5,8 @@ version='0.1.0', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', author='Vover', - author_email='your.email@example.com', - url='https://github.com/yourusername/gpt4tokenizer', # Replace with your repository URL + author_email='vovatara123@gmail.com', + url='https://github.com/T4ras123/SmolBPE', # Replace with your repository URL packages=find_packages(include=['smolbpe', 'smolbpe.*']), install_requires=[ 'regex>=2021.4.4', @@ -23,7 +23,7 @@ }, entry_points={ 'console_scripts': [ - 'gpt4tokenizer=smolbpe.gpt4Tokenizer:main', # If you have a main function + 'gpt4tokenizer=smolbpe.gpt4Tokenizer:main', ], }, ) \ No newline at end of file diff --git a/tests/character_tokenizing.py b/tests/character_tokenizing.py index 2ca1aeb..c674426 100644 --- a/tests/character_tokenizing.py +++ b/tests/character_tokenizing.py @@ -2,7 +2,7 @@ import os sys.path.append(os.path.abspath('../data')) -from data.text import text +from smolbpe.data import text vocab = list(set(text)) stoi = {ch:i for i, ch in enumerate(vocab)} From 0ac5f142a4563c930e2ce082e2c4dfba7badb7b8 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 17:16:44 +0400 Subject: [PATCH 08/19] fix: rename package from gpt4tokenizer to smolbpe in setup.py --- setup.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/setup.py b/setup.py index 3d174a8..42f0633 100644 --- a/setup.py +++ b/setup.py @@ -1,7 +1,7 @@ from setuptools import setup, find_packages setup( - name='gpt4tokenizer', + name='smolbpe', version='0.1.0', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', author='Vover', From fb785debf5ad90f6ce00ceadfd695d8a888e006b Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 17:44:04 +0400 Subject: [PATCH 09/19] chore: update README.md with installation instructions and usage examples; modify setup.py for long description and version bump; include README.md in MANIFEST.in; remove unused test files and refactor GPT4Tokenizer class --- MANIFEST.in | 3 +- README.md | 154 +++++- setup.py | 5 +- smolbpe/basicTokenizer.py | 84 --- smolbpe/data/__init__.py | 0 smolbpe/data/taylorswift.txt | 988 ---------------------------------- smolbpe/data/text.py | 1 - smolbpe/gpt4Tokenizer.py | 8 +- tests/__init__.py | 0 tests/character_tokenizing.py | 14 - tests/tokenization.ipynb | 651 ---------------------- tests/word_tokenization.py | 20 - 12 files changed, 154 insertions(+), 1774 deletions(-) delete mode 100644 smolbpe/basicTokenizer.py delete mode 100644 smolbpe/data/__init__.py delete mode 100644 smolbpe/data/taylorswift.txt delete mode 100644 smolbpe/data/text.py delete mode 100644 tests/__init__.py delete mode 100644 tests/character_tokenizing.py delete mode 100644 tests/tokenization.ipynb delete mode 100644 tests/word_tokenization.py diff --git a/MANIFEST.in b/MANIFEST.in index 454c748..4d35845 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1,2 +1,3 @@ include smolbpe/data/*.txt -include smolbpe/data/*.json \ No newline at end of file +include smolbpe/data/*.json +include README.md \ No newline at end of file diff --git a/README.md b/README.md index 30fde64..2846084 100644 
--- a/README.md +++ b/README.md @@ -1,20 +1,156 @@ # SmolBPE -Tokenization for Deep Learning and Large Language Models (LLMs). -## Description +## Overview -SmolBPE is a repository focused on providing efficient tokenization techniques for deep learning and large language models. This project is composed primarily of Jupyter Notebooks and Python scripts. +**SmolBPE** is a lightweight and efficient Byte Pair Encoding (BPE) tokenizer designed for deep learning applications and large language models (LLMs) such as GPT-4. It provides a simple interface to tokenize textual data, facilitating better handling of out-of-vocabulary words and improving the performance of language models. ## Features -- Efficient tokenization algorithms. +- **Efficient Tokenization**: Implements the BPE algorithm for effective subword tokenization. +- **Customizable Vocabulary Size**: Allows you to specify the desired vocabulary size according to your needs. +- **Unicode Support**: Handles a wide range of characters, including Unicode characters, enabling multilingual tokenization. +- **Easy Integration**: Designed for seamless integration with existing Python projects and NLP pipelines. +- **Command-Line Interface**: Provides a CLI tool for training and using the tokenizer without writing additional code. +- **Open Source**: Licensed under the MIT License, promoting openness and collaboration. ----- +## Installation -## Byte pair encoding +You can install SmolBPE using `pip`: -Byte pair encoding (also known as digram coding) is an algorithm, first described in 1994 by Philip Gage for encoding strings of text into tabular form for use in downstream modeling. Its modification is notable as the large language model tokenizer with an ability to combine both tokens that encode single characters (including single digits or single punctuation marks) and those that encode whole words (even the longest compound words). This modification, in the first step, assumes all unique characters to be an initial set of 1-character long n-grams (i.e. initial "tokens"). Then, successively, the most frequent pair of adjacent characters is merged into a new, 2-character long n-gram and all instances of the pair are replaced by this new token. This is repeated until a vocabulary of prescribed size is obtained. Note that new words can always be constructed from final vocabulary tokens and initial-set characters. This algorithmic approach has been extended from spoken language to sign language in recent years. +```sh +pip install smolbpe +``` -All the unique tokens found in a corpus are listed in a token vocabulary, the size of which, in the case of GPT-3.5 and GPT-4, is 100256. +Alternatively, you can install it directly from the source code: -![image](https://github.com/user-attachments/assets/27cf64e5-42a1-470b-baee-fc5a170bb4eb) +```sh +git clone https://github.com/T4ras123/SmolBPE.git +cd SmolBPE +pip install . 
+``` + +## Quick Start Guide + +### Using the Tokenizer in Python + +1.Importing the Tokenizer + + ```python + from smolbpe.gpt4Tokenizer import GPT4Tokenizer + ``` + +2.Initializing the Tokenizer + + ```python + tokenizer = GPT4Tokenizer() + ``` + + You can specify a custom output file to save the vocab file to and regex pattern if needed: + + ```python + tokenizer = GPT4Tokenizer(output='vocab.json', pattern=r"\p{L}+|\p{Z}+|\p{N}+|[\p{P}&&[^.]]") + ``` + +3.Training the Tokenizer + + Train the tokenizer on your dataset to build the vocabulary and merge rules: + + ```python + with open("path_to_your_data", "r", encoding="utf-8") as f: + text = f.read() + + tokenizer.train(text, vocab_size=400) + ``` + +4.Encoding Text + + Convert text into a list of token IDs: + + ```python + encoded_tokens = tokenizer.encode("Tokenizing isn't real") + print(encoded_tokens) + ``` + +5.Decoding Tokens + +Convert token IDs back into human-readable text: + +```python +decoded_text = tokenizer.decode(encoded_tokens) +print(decoded_text) +``` + +### Command-Line Interface + +SmolBPE provides a command-line interface for easy tokenization tasks. + +#### Training the Tokenizer + +```sh +gpt4tokenizer --text data/taylorswift.txt --vocab_size 400 --output vocab.json +``` + +## Advanced Usage + +### Loading a Pre-trained Vocabulary + +If you have a pre-trained vocabulary and merges file, you can load them directly: + +```python +tokenizer = GPT4Tokenizer() +tokenizer.load_vocab('vocab.json') +``` + +### Custom Regex Pattern + +Customize the tokenization by providing a different regex pattern: + +```python +custom_pattern = r"\w+|\s+|[^\s\w]+" +tokenizer = GPT4Tokenizer(pattern=custom_pattern) +``` + +## Project Structure + +```sh +SmolBPE/ +├── smolbpe/ +│ ├── __init__.py +│ └── gpt4Tokenizer.py +├── LICENSE +├── MANIFEST.in +├── README.md +└── setup.py +``` + +## Contributing + +Contributions are welcome! To contribute: + +1. Fork the repository on GitHub. +2. Create a new branch for your feature or bug fix. +3. Commit your changes with descriptive commit messages. +4. Push your branch to your forked repository. +5. Open a pull request on the main repository. + +Please ensure your code adheres to the project's coding standards and includes appropriate tests. + +## License + +This project is licensed under the MIT License. You are free to use, modify, and distribute this software in accordance with the license. + +## Contact + +For any inquiries or feedback, please contact the author: + +- Author: Vover +- Email: +- GitHub: [T4ras123](https://github.com/T4ras123) + +## Acknowledgments + +- Inspired by tokenization techniques used in GPT models. +- Special thanks to the open-source community for continuous support. + +---- +Happy tokenizing with *SmolBPE*! 
diff --git a/setup.py b/setup.py index 42f0633..575ba49 100644 --- a/setup.py +++ b/setup.py @@ -2,11 +2,12 @@ setup( name='smolbpe', - version='0.1.0', + version='0.2.0', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', + long_description=open('README.md').read(), author='Vover', author_email='vovatara123@gmail.com', - url='https://github.com/T4ras123/SmolBPE', # Replace with your repository URL + url='https://github.com/T4ras123/SmolBPE', packages=find_packages(include=['smolbpe', 'smolbpe.*']), install_requires=[ 'regex>=2021.4.4', diff --git a/smolbpe/basicTokenizer.py b/smolbpe/basicTokenizer.py deleted file mode 100644 index 136d5db..0000000 --- a/smolbpe/basicTokenizer.py +++ /dev/null @@ -1,84 +0,0 @@ - -class BasicTokenizer(): - - - def __init__(self): - self.vocab = {idx : bytes([idx]) for idx in range(256)} - self.merges = dict() - self.special_characters = [] - self.decoded_text = "Pop" - self.encoded_text = [] - - - def train(self, text, vocab_size, verbose = False): - tokens = self.tokenize(text) - steps = vocab_size - 256 - for _ in range(steps): - bigrams = self.get_bigrams(tokens) - pair = max(bigrams, key=bigrams.get) - idx = 256 + _ - tokens = self.merge(tokens, pair, idx) - self.merges[pair] = idx - - for (p1,p2), idx in self.merges.items(): - self.vocab[idx] = self.vocab[p1]+self.vocab[p2] - return tokens - - - def encode(self, text): - tokens = self.tokenize(text) - while len(tokens)>=2: - bigrams = self.get_bigrams(tokens) - pair = min(bigrams, key = lambda p: bigrams.get(p, float("inf"))) - if pair not in self.merges: - break - idx = self.merges[pair] - tokens = self.merge(tokens, pair, idx) - self.encoded_text = tokens - return tokens - - - def decode(self, ids): - tokens = b"".join(self.vocab[idx] for idx in ids) - text = tokens.decode("utf-8", errors="replace") - self.decoded_text = text - return text - - - def get_bigrams(self, tokens): - bigrams = {} - for pair in zip(tokens, tokens[1:]): - bigrams[pair] = bigrams.get(pair, 0) + 1 - return bigrams - - - def merge(self, text, pair, idx): - newids = [] - id = 0 - while id=2:\n", - " stats = byte_pairs(tokens)\n", - " pair = min(stats, key = lambda p: merges.get(p, float(\"inf\")))\n", - " if pair not in merges:\n", - " break\n", - " idx = merges[pair]\n", - " tokens = merges(tokens, pair, idx)\n", - " \n", - " return tokens\n", - " \n", - " \n", - "print(encode(\"PFD\"))" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Forcing splits with regex" - ] - }, - { - "cell_type": "code", - "execution_count": 13, - "metadata": {}, - "outputs": [], - "source": [ - "import regex as re # type: ignore" - ] - }, - { - "cell_type": "code", - "execution_count": 14, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['Hello', \"'ve\", ' world', ' how', '123', ' are', ' you']\n" - ] - } - ], - "source": [ - "gpt2pat = re.compile(r\"\"\"'s|'t|'re|'ve|'m|'ll|'d| ?\\p{L}+| ?\\p{N}+| ?[^\\s\\p{L}\\p{N}]+|\\s+(?!\\S)|\\s+\"\"\")\n", - "print(re.findall(gpt2pat, \"Hello've world how123 are you\"))" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "ML", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": 
"ipython3", - "version": "3.12.3" - } - }, - "nbformat": 4, - "nbformat_minor": 2 -} diff --git a/tests/word_tokenization.py b/tests/word_tokenization.py deleted file mode 100644 index 081618b..0000000 --- a/tests/word_tokenization.py +++ /dev/null @@ -1,20 +0,0 @@ -import sys -import os - -# Add the parent directory to the Python path -sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..', 'data'))) - -# Import the text variable from the text module -from text import text - -tokenized_text = text.split() - -dictionary = list(set(tokenized_text)) - -wtoi = {w:i for i,w in enumerate(dictionary)} -itow = {i:w for w, i in wtoi.items()} - -encode = lambda text: [wtoi[i] for i in text.split()] -decode = lambda ids: " ".join(itow[i] for i in ids) - -print(decode(encode("Introduction to Unicode"))) From dbbf7bf6f8b20d8eb561079e650b4d1b86a6d288 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 17:55:44 +0400 Subject: [PATCH 10/19] chore: include LICENSE in MANIFEST.in and update setup.py for UTF-8 encoding and markdown content type --- MANIFEST.in | 3 ++- setup.py | 3 ++- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/MANIFEST.in b/MANIFEST.in index 4d35845..5ef47fd 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -1,3 +1,4 @@ include smolbpe/data/*.txt include smolbpe/data/*.json -include README.md \ No newline at end of file +include README.md +include LICENSE \ No newline at end of file diff --git a/setup.py b/setup.py index 575ba49..f77fba8 100644 --- a/setup.py +++ b/setup.py @@ -4,7 +4,8 @@ name='smolbpe', version='0.2.0', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', - long_description=open('README.md').read(), + long_description=open('README.md', encoding='utf-8').read(), + long_description_content_type='text/markdown', author='Vover', author_email='vovatara123@gmail.com', url='https://github.com/T4ras123/SmolBPE', From c358f028143d1e23e28385c7521c82a0dd6ba9a5 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 23:06:58 +0400 Subject: [PATCH 11/19] feat: add badges for version, downloads, stars, license, Python versions, and sponsorship to README.md --- README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/README.md b/README.md index 2846084..5c4f2ce 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,7 @@ # SmolBPE +![PyPI Version](https://img.shields.io/pypi/v/smolbpe) ![PyPI Downloads](https://img.shields.io/pypi/dm/smolbpe) ![GitHub Stars](https://img.shields.io/github/stars/T4ras123/SmolBPE?style=social) ![License](https://img.shields.io/github/license/T4ras123/SmolBPE) ![Python Versions](https://img.shields.io/pypi/pyversions/smolbpe) ![GitHub code size in bytes](https://img.shields.io/github/languages/code-size/T4ras123/SmolBPE) [![Sponsor](https://img.shields.io/badge/sponsor-GitHub%20Sponsors-critical)](https://github.com/sponsors/T4ras123) [![Twitter Follow](https://img.shields.io/twitter/follow/yourusername?style=social)](https://twitter.com/Vover163) ![PyPI - Downloads](https://img.shields.io/pypi/dt/smolbpe) ![Made with Love](https://img.shields.io/badge/Made%20with-%E2%9D%A4-red) + ## Overview **SmolBPE** is a lightweight and efficient Byte Pair Encoding (BPE) tokenizer designed for deep learning applications and large language models (LLMs) such as GPT-4. It provides a simple interface to tokenize textual data, facilitating better handling of out-of-vocabulary words and improving the performance of language models. 
From 11035c43c3f5c594c2223c0e827ba0471f7898bc Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 23:08:43 +0400 Subject: [PATCH 12/19] fix: reorder badges in README.md for improved clarity --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 5c4f2ce..f8e1905 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # SmolBPE -![PyPI Version](https://img.shields.io/pypi/v/smolbpe) ![PyPI Downloads](https://img.shields.io/pypi/dm/smolbpe) ![GitHub Stars](https://img.shields.io/github/stars/T4ras123/SmolBPE?style=social) ![License](https://img.shields.io/github/license/T4ras123/SmolBPE) ![Python Versions](https://img.shields.io/pypi/pyversions/smolbpe) ![GitHub code size in bytes](https://img.shields.io/github/languages/code-size/T4ras123/SmolBPE) [![Sponsor](https://img.shields.io/badge/sponsor-GitHub%20Sponsors-critical)](https://github.com/sponsors/T4ras123) [![Twitter Follow](https://img.shields.io/twitter/follow/yourusername?style=social)](https://twitter.com/Vover163) ![PyPI - Downloads](https://img.shields.io/pypi/dt/smolbpe) ![Made with Love](https://img.shields.io/badge/Made%20with-%E2%9D%A4-red) +![PyPI Version](https://img.shields.io/pypi/v/smolbpe) ![PyPI - Downloads](https://img.shields.io/pypi/dm/smolbpe) ![GitHub Stars](https://img.shields.io/github/stars/T4ras123/SmolBPE?style=social) ![License](https://img.shields.io/github/license/T4ras123/SmolBPE) ![Python Versions](https://img.shields.io/pypi/pyversions/smolbpe) ![GitHub code size in bytes](https://img.shields.io/github/languages/code-size/T4ras123/SmolBPE) [![Sponsor](https://img.shields.io/badge/sponsor-GitHub%20Sponsors-critical)](https://github.com/sponsors/T4ras123) [![Twitter Follow](https://img.shields.io/twitter/follow/yourusername?style=social)](https://twitter.com/Vover163) ![PyPI - Downloads](https://img.shields.io/pypi/dt/smolbpe) ![Made with Love](https://img.shields.io/badge/Made%20with-%E2%9D%A4-red) ## Overview From dd20e82b2cedc4adc543aa40ec5552a7692b35cb Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Sun, 3 Nov 2024 23:10:03 +0400 Subject: [PATCH 13/19] fix: update Twitter badge link in README.md for correct username --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index f8e1905..33f98b9 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # SmolBPE -![PyPI Version](https://img.shields.io/pypi/v/smolbpe) ![PyPI - Downloads](https://img.shields.io/pypi/dm/smolbpe) ![GitHub Stars](https://img.shields.io/github/stars/T4ras123/SmolBPE?style=social) ![License](https://img.shields.io/github/license/T4ras123/SmolBPE) ![Python Versions](https://img.shields.io/pypi/pyversions/smolbpe) ![GitHub code size in bytes](https://img.shields.io/github/languages/code-size/T4ras123/SmolBPE) [![Sponsor](https://img.shields.io/badge/sponsor-GitHub%20Sponsors-critical)](https://github.com/sponsors/T4ras123) [![Twitter Follow](https://img.shields.io/twitter/follow/yourusername?style=social)](https://twitter.com/Vover163) ![PyPI - Downloads](https://img.shields.io/pypi/dt/smolbpe) ![Made with Love](https://img.shields.io/badge/Made%20with-%E2%9D%A4-red) +![PyPI Version](https://img.shields.io/pypi/v/smolbpe) ![PyPI - Downloads](https://img.shields.io/pypi/dm/smolbpe) ![GitHub Stars](https://img.shields.io/github/stars/T4ras123/SmolBPE?style=social) ![License](https://img.shields.io/github/license/T4ras123/SmolBPE) ![Python Versions](https://img.shields.io/pypi/pyversions/smolbpe) ![GitHub code size in 
bytes](https://img.shields.io/github/languages/code-size/T4ras123/SmolBPE) [![Sponsor](https://img.shields.io/badge/sponsor-GitHub%20Sponsors-critical)](https://github.com/sponsors/T4ras123) [![Twitter Follow](https://img.shields.io/twitter/follow/vover163?style=social)](https://twitter.com/Vover163) ![Made with Love](https://img.shields.io/badge/Made%20with-%E2%9D%A4-red) ## Overview From d6ab197213e32c1279dddb495b94e223934c7386 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 11:20:19 +0400 Subject: [PATCH 14/19] feat: enhance GPT4Tokenizer to support special tokens and improve training logic --- .gitignore | 4 ++- smolbpe/gpt4Tokenizer.py | 78 ++++++++++++++++++++++++++++------------ 2 files changed, 58 insertions(+), 24 deletions(-) diff --git a/.gitignore b/.gitignore index 9151771..2f83b38 100644 --- a/.gitignore +++ b/.gitignore @@ -163,4 +163,6 @@ cython_debug/ -.vscode/* \ No newline at end of file +.vscode/* +smolbpe/text.txt +smolbpe/vocab.json diff --git a/smolbpe/gpt4Tokenizer.py b/smolbpe/gpt4Tokenizer.py index d97a2e1..96ec68a 100644 --- a/smolbpe/gpt4Tokenizer.py +++ b/smolbpe/gpt4Tokenizer.py @@ -4,54 +4,84 @@ class GPT4Tokenizer(): - def __init__(self, output='vocab.json', pattern=None): + def __init__(self, output='vocab.json', pattern=None, special_tokens=None): self.vocab = {idx : bytes([idx]) for idx in range(256)} self.merges = dict() - self.pattern = pattern if pattern else r"\p{L}+|\p{Z}+|\p{N}+|[\p{P}&&[^.]]" + self.pattern = pattern if pattern else r"." self.splitby = re.compile(self.pattern) self.output_file = output + self.special_tokens = special_tokens if special_tokens else [] + self.special_token_ids = {} + for i, token in enumerate(self.special_tokens): + token_id = 256 + i + self.vocab[token_id] = token.encode('utf-8') + self.merges[(token_id, token_id)] = token_id + self.special_token_ids[token] = token_id def train(self, text, vocab_size): - assert vocab_size >= 256 - - num_merges = vocab_size - 256 - + + assert vocab_size > len(self.vocab), "Vocab size must be greater than the number of tokens in the vocab" + num_merges = vocab_size - len(self.vocab) text_splitted = re.findall(self.splitby, text) - - ids = [list(ch.encode("utf-8")) for ch in text_splitted] - + ids = [list(self.encode(chunk)) for chunk in text_splitted] + vocab_len = max(self.vocab.keys()) + 1 for i in range(num_merges): stats = {} for _ in ids: self.get_pairs(_, stats) + if not stats: + print(f"No more pairs to merge at iteration {i}. 
Stopping early.") + break pair = max(stats, key=stats.get) - idx = 256 + i - ids = [self.merge(chunk_ids, pair, idx) for chunk_ids in ids] + idx = vocab_len + i self.merges[pair] = idx self.vocab[idx] = self.vocab[pair[0]] + self.vocab[pair[1]] - self.save_vocab_and_merges(self.path) - + ids = [self.merge(chunk_ids, pair, idx) for chunk_ids in ids] + self.save_vocab_and_merges(self.output_file) def encode(self, text): - ids = list(text.encode('utf-8')) - + tokens = [] + i = 0 + while i < len(text): + matched = False + # Check for special tokens at the current position + for token in self.special_tokens: + if text.startswith(token, i): + token_id = self.special_token_ids[token] + tokens.append(token_id) + i += len(token) + matched = True + break + if not matched: + # Find the next special token position + next_positions = [text.find(st, i) for st in self.special_tokens if text.find(st, i) != -1] + next_special = min(next_positions) if next_positions else len(text) + # Extract substring up to the next special token + substring = text[i:next_special] + # Encode the substring using BPE + ids = list(substring.encode('utf-8')) + ids = self.apply_bpe(ids) + tokens.extend(ids) + i = next_special + return tokens + + + def apply_bpe(self, ids): while True: pairs = self.get_pairs(ids) mergeable_pairs = {p: self.merges[p] for p in pairs if p in self.merges} - if not mergeable_pairs: break pair = min(mergeable_pairs, key=self.merges.get) - ids = self.merge(ids, pair, self.merges[pair]) return ids - + def decode(self, ids): tokens = b"".join(self.vocab[idx] for idx in ids) @@ -68,7 +98,7 @@ def get_pairs(self, ids, counts=None): return counts - def save_vocab_and_merges(self): + def save_vocab_and_merges(self, path): data = { 'vocab': {}, 'merges': {} @@ -81,9 +111,9 @@ def save_vocab_and_merges(self): data['vocab'][str(idx)] = byte_val.hex() # Save merges for (first, second), idx in self.merges.items(): - key = f"{first},{second}" # Convert tuple to string + key = f"{first},{second}" data['merges'][key] = idx - with open(self.output_file, 'w', encoding='utf-8') as f: + with open(path, 'w', encoding='utf-8') as f: json.dump(data, f, indent=2) @@ -122,10 +152,12 @@ def merge(self, ids, pair, idx): parser.add_argument('-v','--vocab_size', type=int, help='Vocab size for tokenizer') parser.add_argument('-o', '--output', default='vocab.json', type=str, help='Output path for vocab and merges') parser.add_argument('-p', '--pattern', type=str, help='Regex pattern to split text') + parser.add_argument('-s', '--special_tokens', nargs='*', default=None, help='Special tokens to add to vocab') args = parser.parse_args() with open(args.text, 'r') as f: args.text = f.read() - - tokenizer = GPT4Tokenizer(args.output, args.pattern) + print(args.special_tokens) + tokenizer = GPT4Tokenizer(args.output, args.pattern, special_tokens=args.special_tokens) tokenizer.train(args.text, args.vocab_size) + print(f"Tokenizer trained and saved to {args.output}") \ No newline at end of file From 3a189476b66510d9294e92e154b9edefd1d6c646 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 12:36:50 +0400 Subject: [PATCH 15/19] chore: bump version to 0.3.0 in setup.py --- setup.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/setup.py b/setup.py index f77fba8..756ff44 100644 --- a/setup.py +++ b/setup.py @@ -2,7 +2,7 @@ setup( name='smolbpe', - version='0.2.0', + version='0.3.0', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', long_description=open('README.md', 
encoding='utf-8').read(), long_description_content_type='text/markdown', @@ -28,4 +28,4 @@ 'gpt4tokenizer=smolbpe.gpt4Tokenizer:main', ], }, -) \ No newline at end of file +) From 503c4ef8fc8b054a680e8561b5e418bc546ebd72 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 12:39:01 +0400 Subject: [PATCH 16/19] refactor: clean up comments and whitespace in GPT4Tokenizer --- smolbpe/gpt4Tokenizer.py | 9 +-------- 1 file changed, 1 insertion(+), 8 deletions(-) diff --git a/smolbpe/gpt4Tokenizer.py b/smolbpe/gpt4Tokenizer.py index 96ec68a..5e7549e 100644 --- a/smolbpe/gpt4Tokenizer.py +++ b/smolbpe/gpt4Tokenizer.py @@ -20,8 +20,7 @@ def __init__(self, output='vocab.json', pattern=None, special_tokens=None): def train(self, text, vocab_size): - - + assert vocab_size > len(self.vocab), "Vocab size must be greater than the number of tokens in the vocab" num_merges = vocab_size - len(self.vocab) text_splitted = re.findall(self.splitby, text) @@ -47,7 +46,6 @@ def encode(self, text): i = 0 while i < len(text): matched = False - # Check for special tokens at the current position for token in self.special_tokens: if text.startswith(token, i): token_id = self.special_token_ids[token] @@ -56,12 +54,9 @@ def encode(self, text): matched = True break if not matched: - # Find the next special token position next_positions = [text.find(st, i) for st in self.special_tokens if text.find(st, i) != -1] next_special = min(next_positions) if next_positions else len(text) - # Extract substring up to the next special token substring = text[i:next_special] - # Encode the substring using BPE ids = list(substring.encode('utf-8')) ids = self.apply_bpe(ids) tokens.extend(ids) @@ -120,12 +115,10 @@ def save_vocab_and_merges(self, path): def load_vocab(self, path='vocab.json'): with open(path, 'r', encoding='utf-8') as f: data = json.load(f) - # Load vocab self.vocab = {} for idx_str, value in data['vocab'].items(): idx = idx_str self.vocab[idx] = value.encode('utf-8') - # Load merges self.merges = {} for pair_str, idx in data['merges'].items(): first_str, second_str = pair_str.split(',') From eb6a3f896809442a068afc3519d939a1af5d5c52 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 12:40:15 +0400 Subject: [PATCH 17/19] feat: migrate GPT4Tokenizer implementation to a new file and enhance structure --- smolbpe/{gpt4Tokenizer.py => tokenizer.py} | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename smolbpe/{gpt4Tokenizer.py => tokenizer.py} (100%) diff --git a/smolbpe/gpt4Tokenizer.py b/smolbpe/tokenizer.py similarity index 100% rename from smolbpe/gpt4Tokenizer.py rename to smolbpe/tokenizer.py From 11202855e94dd2d520fcc7a38d44cb239add0b45 Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 12:47:41 +0400 Subject: [PATCH 18/19] feat: update GPT4Tokenizer constructor to set default regex pattern and improve argument order --- smolbpe/tokenizer.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/smolbpe/tokenizer.py b/smolbpe/tokenizer.py index 5e7549e..5cf27c7 100644 --- a/smolbpe/tokenizer.py +++ b/smolbpe/tokenizer.py @@ -4,10 +4,10 @@ class GPT4Tokenizer(): - def __init__(self, output='vocab.json', pattern=None, special_tokens=None): + def __init__(self, output='vocab.json', special_tokens=None, pattern=r"""'(?i:[sdmt]|ll|ve|re)|[^\r\n\p{L}\p{N}]?+\p{L}+|\p{N}{1,3}| ?[^\s\p{L}\p{N}]++[\r\n]*|\s*[\r\n]|\s+(?!\S)|\s+"""): self.vocab = {idx : bytes([idx]) for idx in range(256)} self.merges = dict() - self.pattern = pattern if pattern else r"." 
+ self.pattern = pattern self.splitby = re.compile(self.pattern) self.output_file = output self.special_tokens = special_tokens if special_tokens else [] @@ -142,15 +142,15 @@ def merge(self, ids, pair, idx): if __name__=='__main__': parser = argparse.ArgumentParser() parser.add_argument('-t', '--text', type=str, help='Text to train tokenizer on') - parser.add_argument('-v','--vocab_size', type=int, help='Vocab size for tokenizer') + parser.add_argument('-v', '--vocab_size', type=int, help='Vocab size for tokenizer') parser.add_argument('-o', '--output', default='vocab.json', type=str, help='Output path for vocab and merges') - parser.add_argument('-p', '--pattern', type=str, help='Regex pattern to split text') + parser.add_argument('-p', '--pattern', type=str, default=r"""'(?i:[sdmt]|ll|ve|re)|[^\r\n\p{L}\p{N}]?+\p{L}+|\p{N}{1,3}| ?[^\s\p{L}\p{N}]++[\r\n]*|\s*[\r\n]|\s+(?!\S)|\s+""", help='Regex pattern to split text') parser.add_argument('-s', '--special_tokens', nargs='*', default=None, help='Special tokens to add to vocab') args = parser.parse_args() with open(args.text, 'r') as f: args.text = f.read() print(args.special_tokens) - tokenizer = GPT4Tokenizer(args.output, args.pattern, special_tokens=args.special_tokens) + tokenizer = GPT4Tokenizer(args.output, special_tokens=args.special_tokens, pattern=args.pattern) tokenizer.train(args.text, args.vocab_size) print(f"Tokenizer trained and saved to {args.output}") \ No newline at end of file From fba88fa6c150f40109b106012195ea452566217a Mon Sep 17 00:00:00 2001 From: T4ras123 Date: Mon, 4 Nov 2024 12:59:35 +0400 Subject: [PATCH 19/19] feat: rename GPT4Tokenizer to Tokenizer and update README and setup.py --- .gitignore | 1 + README.md | 14 +++++++------- setup.py | 2 +- smolbpe/tokenizer.py | 4 ++-- 4 files changed, 11 insertions(+), 10 deletions(-) diff --git a/.gitignore b/.gitignore index 2f83b38..aee1f37 100644 --- a/.gitignore +++ b/.gitignore @@ -166,3 +166,4 @@ cython_debug/ .vscode/* smolbpe/text.txt smolbpe/vocab.json +test.py diff --git a/README.md b/README.md index 33f98b9..9ce36f2 100644 --- a/README.md +++ b/README.md @@ -38,19 +38,19 @@ pip install . 1.Importing the Tokenizer ```python - from smolbpe.gpt4Tokenizer import GPT4Tokenizer + from smolbpe.tokenizer import Tokenizer ``` 2.Initializing the Tokenizer ```python - tokenizer = GPT4Tokenizer() + tokenizer = Tokenizer() ``` You can specify a custom output file to save the vocab file to and regex pattern if needed: ```python - tokenizer = GPT4Tokenizer(output='vocab.json', pattern=r"\p{L}+|\p{Z}+|\p{N}+|[\p{P}&&[^.]]") + tokenizer = Tokenizer(output='vocab.json', pattern=r"\p{L}+|\p{Z}+|\p{N}+|[\p{P}&&[^.]]") ``` 3.Training the Tokenizer @@ -89,7 +89,7 @@ SmolBPE provides a command-line interface for easy tokenization tasks. 
#### Training the Tokenizer ```sh -gpt4tokenizer --text data/taylorswift.txt --vocab_size 400 --output vocab.json +tokenizer --text smth.txt --vocab_size 400 --output vocab.json ``` ## Advanced Usage @@ -99,7 +99,7 @@ gpt4tokenizer --text data/taylorswift.txt --vocab_size 400 --output vocab.json If you have a pre-trained vocabulary and merges file, you can load them directly: ```python -tokenizer = GPT4Tokenizer() +tokenizer = Tokenizer() tokenizer.load_vocab('vocab.json') ``` @@ -109,7 +109,7 @@ Customize the tokenization by providing a different regex pattern: ```python custom_pattern = r"\w+|\s+|[^\s\w]+" -tokenizer = GPT4Tokenizer(pattern=custom_pattern) +tokenizer = Tokenizer(pattern=custom_pattern) ``` ## Project Structure @@ -118,7 +118,7 @@ tokenizer = GPT4Tokenizer(pattern=custom_pattern) SmolBPE/ ├── smolbpe/ │ ├── __init__.py -│ └── gpt4Tokenizer.py +│ └── tokenizer.py ├── LICENSE ├── MANIFEST.in ├── README.md diff --git a/setup.py b/setup.py index 756ff44..9734021 100644 --- a/setup.py +++ b/setup.py @@ -2,7 +2,7 @@ setup( name='smolbpe', - version='0.3.0', + version='0.3.1', description='A GPT-4 compatible Byte Pair Encoding (BPE) tokenizer.', long_description=open('README.md', encoding='utf-8').read(), long_description_content_type='text/markdown', diff --git a/smolbpe/tokenizer.py b/smolbpe/tokenizer.py index 5cf27c7..ed3d3b2 100644 --- a/smolbpe/tokenizer.py +++ b/smolbpe/tokenizer.py @@ -3,7 +3,7 @@ import json -class GPT4Tokenizer(): +class Tokenizer(): def __init__(self, output='vocab.json', special_tokens=None, pattern=r"""'(?i:[sdmt]|ll|ve|re)|[^\r\n\p{L}\p{N}]?+\p{L}+|\p{N}{1,3}| ?[^\s\p{L}\p{N}]++[\r\n]*|\s*[\r\n]|\s+(?!\S)|\s+"""): self.vocab = {idx : bytes([idx]) for idx in range(256)} self.merges = dict() @@ -151,6 +151,6 @@ def merge(self, ids, pair, idx): with open(args.text, 'r') as f: args.text = f.read() print(args.special_tokens) - tokenizer = GPT4Tokenizer(args.output, special_tokens=args.special_tokens, pattern=args.pattern) + tokenizer = Tokenizer(args.output, special_tokens=args.special_tokens, pattern=args.pattern) tokenizer.train(args.text, args.vocab_size) print(f"Tokenizer trained and saved to {args.output}") \ No newline at end of file
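After the final patch, the public surface of the package is the `Tokenizer` class in `smolbpe/tokenizer.py` (smolbpe 0.3.1). The sketch below exercises that API end to end using the calls shown in the diffs (`train`, `encode`, `decode`); the corpus path and the `<|endoftext|>` special token are illustrative placeholders rather than values fixed by the patches, while `vocab_size=400` and the sample sentence come from the README above.

```python
# End-to-end usage sketch of the API as it stands after PATCH 19/19.
# "corpus.txt" and the <|endoftext|> special token are placeholder choices.
from smolbpe.tokenizer import Tokenizer

tokenizer = Tokenizer(output="vocab.json", special_tokens=["<|endoftext|>"])

with open("corpus.txt", "r", encoding="utf-8") as f:
    text = f.read()

# Training also writes vocab.json via save_vocab_and_merges().
tokenizer.train(text, vocab_size=400)

ids = tokenizer.encode("Tokenizing isn't real<|endoftext|>")
print(ids)
print(tokenizer.decode(ids))  # byte-level BPE decodes back to the input text
```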