diff --git a/semantic_router/splitters/__init__.py b/semantic_router/splitters/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/semantic_router/splitters/base.py b/semantic_router/splitters/base.py
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/semantic_router/splitters/cav_sim.py b/semantic_router/splitters/cav_sim.py
new file mode 100644
index 0000000000000000000000000000000000000000..67afac63befd8397443f08fcc0220b23bdc046db
--- /dev/null
+++ b/semantic_router/splitters/cav_sim.py
@@ -0,0 +1,4 @@
+
+"""
+cav_sim stands for "cumulative average vector similarity": in this code, the cumulative average of the embedding vectors is compared to the next embedding vector.
+"""
\ No newline at end of file
diff --git a/semantic_router/splitters/consecutive_sim.py b/semantic_router/splitters/consecutive_sim.py
new file mode 100644
index 0000000000000000000000000000000000000000..892f7d1881473a7bee5a612544234904e07d9f51
--- /dev/null
+++ b/semantic_router/splitters/consecutive_sim.py
@@ -0,0 +1,3 @@
+"""
+Called "consecutive sim" because we check the similarity of consecutive document embeddings (comparing the i-th document embedding to the (i+1)-th).
+"""
\ No newline at end of file
diff --git a/semantic_router/splitters/cumulative_sim.py b/semantic_router/splitters/cumulative_sim.py
new file mode 100644
index 0000000000000000000000000000000000000000..7c7c35b7da6f30b338a178caaebf6b6bbfc9c46f
--- /dev/null
+++ b/semantic_router/splitters/cumulative_sim.py
@@ -0,0 +1,3 @@
+"""
+Called "cumulative sim" because we check the similarity between the embedding of the cumulatively concatenated documents and the next document.
+"""
\ No newline at end of file