pytorch
diff --git a/.ci/scripts/test_llama.sh b/.ci/scripts/test_llama.sh
Lines changed: 1 addition & 1 deletion
diff --git a/.ci/scripts/test_llama_torchao_lowbit.sh b/.ci/scripts/test_llama_torchao_lowbit.sh
Lines changed: 1 addition & 1 deletion
diff --git a/.ci/scripts/test_phi_3_mini.sh b/.ci/scripts/test_phi_3_mini.sh
Lines changed: 1 addition & 1 deletion
diff --git a/.ci/scripts/test_qnn_static_llama.sh b/.ci/scripts/test_qnn_static_llama.sh
Lines changed: 1 addition & 1 deletion
diff --git a/CMakeLists.txt b/CMakeLists.txt
Lines changed: 1 addition & 1 deletion
diff --git a/examples/models/llama/TARGETS b/examples/models/llama/TARGETS
Lines changed: 1 addition & 1 deletion
diff --git a/examples/models/llama/eval_llama_lib.py b/examples/models/llama/eval_llama_lib.py
Lines changed: 3 additions & 5 deletions
diff --git a/examples/models/llama/evaluate/eager_eval.py b/examples/models/llama/evaluate/eager_eval.py
Lines changed: 2 additions & 4 deletions
diff --git a/examples/models/llama/runner/generation.py b/examples/models/llama/runner/generation.py
Lines changed: 1 addition & 1 deletion
diff --git a/examples/models/llama/tokenizer/targets.bzl b/examples/models/llama/tokenizer/targets.bzl
Lines changed: 0 additions & 1 deletion
diff --git a/examples/models/llama/tokenizer/test/test_tiktoken.cpp b/examples/models/llama/tokenizer/test/test_tiktoken.cpp
Lines changed: 5 additions & 5 deletions
diff --git a/examples/models/llava/export_llava.py b/examples/models/llava/export_llava.py
Lines changed: 1 addition & 1 deletion
diff --git a/examples/qualcomm/oss_scripts/llama/CMakeLists.txt b/examples/qualcomm/oss_scripts/llama/CMakeLists.txt
Lines changed: 2 additions & 2 deletions
diff --git a/extension/llm/export/TARGETS b/extension/llm/export/TARGETS
Lines changed: 1 addition & 1 deletion
diff --git a/extension/llm/export/builder.py b/extension/llm/export/builder.py
Lines changed: 1 addition & 1 deletion
diff --git a/extension/llm/tokenizer/CMakeLists.txt b/extension/llm/tokenizer/CMakeLists.txt
Lines changed: 0 additions & 62 deletions
diff --git a/extension/llm/tokenizer/TARGETS b/extension/llm/tokenizer/TARGETS
Lines changed: 0 additions & 8 deletions
diff --git a/extension/llm/tokenizer/__init__.py b/extension/llm/tokenizer/__init__.py
@@ -269,7 +269,7 @@ $PYTHON_EXECUTABLE -m examples.models.llama.export_llama ${EXPORT_ARGS}
 
 # Create tokenizer.bin.
 echo "Creating tokenizer.bin"
-$PYTHON_EXECUTABLE -m extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
+$PYTHON_EXECUTABLE -m pytorch_tokenizers.tools.llama2c.convert -t tokenizer.model -o tokenizer.bin
 
 
 RUNTIME_ARGS="--model_path=${EXPORTED_MODEL_NAME} --tokenizer_path=tokenizer.bin --prompt=Once --temperature=0 --seq_len=10 --warmup=1"
 
@@ -55,7 +55,7 @@ cmake --build cmake-out/examples/models/llama -j16 --config Release
 download_stories_model_artifacts
 
 echo "Creating tokenizer.bin"
-$PYTHON_EXECUTABLE -m extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
+$PYTHON_EXECUTABLE -m pytorch_tokenizers.tools.llama2c.convert -t tokenizer.model -o tokenizer.bin
 
 # Export model
 LLAMA_CHECKPOINT=stories110M.pt
 
@@ -56,7 +56,7 @@ cmake_build_phi_3_mini() {
 prepare_tokenizer() {
   echo "Downloading and converting tokenizer.model"
   wget -O tokenizer.model "https://huggingface.co/microsoft/Phi-3-mini-128k-instruct/resolve/main/tokenizer.model?download=true"
-  $PYTHON_EXECUTABLE -m executorch.extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
+  $PYTHON_EXECUTABLE -m pytorch_tokenizers.tools.llama2c.convert -t tokenizer.model -o tokenizer.bin
 }
 
 # Export phi-3-mini model to pte
 
@@ -30,7 +30,7 @@ pip install graphviz
 # Download stories llama110m artifacts
 download_stories_model_artifacts
 echo "Creating tokenizer.bin"
-$PYTHON_EXECUTABLE -m extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
+$PYTHON_EXECUTABLE -m pytorch_tokenizers.tools.llama2c.convert -t tokenizer.model -o tokenizer.bin
 
 set +e
 # Compile only as weight sharing is not applicable on x86
 
@@ -757,7 +757,7 @@ if(EXECUTORCH_BUILD_EXTENSION_FLAT_TENSOR)
 endif()
 
 if(EXECUTORCH_BUILD_EXTENSION_LLM)
-  add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/extension/llm/tokenizer)
+  add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/extension/llm/tokenizers)
 endif()
 
 if(EXECUTORCH_BUILD_EXTENSION_MODULE)
 
@@ -202,7 +202,7 @@ runtime.python_library(
         ":export_library",
         "//executorch/examples/models/llama/tokenizer:tiktoken_py",
         "//executorch/extension/llm/export:export_lib",
-        "//executorch/extension/llm/tokenizer:tokenizer_py_lib",
+        "//pytorch/tokenizers/pytorch_tokenizers:tokenizers",
         "//executorch/extension/pybindings:portable_lib",
     ],
 )
 
@@ -15,14 +15,12 @@
 from executorch.examples.models.llama.export_llama_lib import (
     get_quantizer_and_quant_params,
 )
-from executorch.examples.models.llama.tokenizer.tiktoken import Tokenizer as Tiktoken
 
 from executorch.extension.llm.export.builder import LLMEdgeManager
-from executorch.extension.llm.tokenizer.tokenizer import (
-    Tokenizer as SentencePieceTokenizer,
-)
-from executorch.extension.llm.tokenizer.utils import get_tokenizer
 from lm_eval.evaluator import simple_evaluate
+from pytorch_tokenizers import get_tokenizer
+from pytorch_tokenizers.llama2c import Llama2cTokenizer as SentencePieceTokenizer
+from pytorch_tokenizers.tiktoken import TiktokenTokenizer as Tiktoken
 from torch.nn import CrossEntropyLoss
 from tqdm import tqdm
 
 
@@ -8,12 +8,10 @@
 from typing import Optional, Union
 
 import torch
-from executorch.examples.models.llama.tokenizer.tiktoken import Tokenizer as Tiktoken
-from executorch.extension.llm.tokenizer.tokenizer import (
-    Tokenizer as SentencePieceTokenizer,
-)
 
 from lm_eval.models.huggingface import HFLM as eval_wrapper
+from pytorch_tokenizers.llama2c import Llama2cTokenizer as SentencePieceTokenizer
+from pytorch_tokenizers.tiktoken import TiktokenTokenizer as Tiktoken
 
 from torch import nn
 
 
@@ -10,7 +10,7 @@
 
 import torch
 
-from executorch.extension.llm.tokenizer.utils import get_tokenizer
+from pytorch_tokenizers import get_tokenizer
 
 
 def sample_top_p(probs, p):
 
@@ -16,7 +16,6 @@ def define_common_targets():
         ],
         exported_deps = [
             "//pytorch/tokenizers:tiktoken",
-            "//executorch/extension/llm/tokenizer:tiktoken", # TODO: remove
         ],
         visibility = [
             "@EXECUTORCH_CLIENTS",
 
@@ -10,7 +10,7 @@
 
 #include <vector>
 
-#include <executorch/extension/llm/tokenizer/tiktoken.h>
+#include <pytorch/tokenizers/tiktoken.h>
 
 #include <gtest/gtest.h>
 
@@ -21,9 +21,9 @@
 using namespace ::testing;
 
 using ::example::Version;
-using ::executorch::extension::llm::Tokenizer;
-using ::executorch::runtime::Error;
-using ::executorch::runtime::Result;
+using ::tokenizers::Error;
+using ::tokenizers::Result;
+using ::tokenizers::Tokenizer;
 
 static std::string get_resource_path(const std::string& name) {
 #ifdef EXECUTORCH_FB_BUCK
@@ -36,7 +36,7 @@ static std::string get_resource_path(const std::string& name) {
 class MultimodalTiktokenV5ExtensionTest : public Test {
  public:
   void SetUp() override {
-    tokenizer_ = std::make_unique<executorch::extension::llm::Tiktoken>(
+    tokenizer_ = std::make_unique<tokenizers::Tiktoken>(
         example::get_multimodal_special_tokens(), 0, 1);
     modelPath_ = get_resource_path("test_tiktoken_tokenizer.model");
   }
 
@@ -46,8 +46,8 @@
 )
 
 from executorch.extension.llm.export.builder import DType, LLMEdgeManager
-from executorch.extension.llm.tokenizer.tokenizer import Tokenizer
 from executorch.util.activation_memory_profiler import generate_memory_trace
+from pytorch_tokenizers.llama2c import Llama2cTokenizer as Tokenizer
 from torch.export import Dim
 from torch.nn.attention import SDPBackend
 
 
@@ -5,7 +5,7 @@
 # LICENSE file in the root directory of this source tree.
 
 # model sharding with custom op
-set(CUSTOM_OP_SRCS_FILE 
+set(CUSTOM_OP_SRCS_FILE
   "${EXECUTORCH_SOURCE_DIR}/extension/llm/custom_ops/op_fallback.cpp"
 )
 add_library(custom_ops ${CUSTOM_OP_SRCS_FILE})
@@ -35,7 +35,7 @@ list(
 list(
   APPEND
   _llama_runner__srcs
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../extension/llm/tokenizer/tiktoken.cpp
+  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../extension/llm/tokenizers/src/tiktoken.cpp
   ${CMAKE_CURRENT_SOURCE_DIR}/../../../models/llama/tokenizer/llama_tiktoken.cpp
 )
 
 
@@ -40,6 +40,6 @@ runtime.python_library(
         "//executorch/exir:lib",
         "//executorch/exir/backend:backend_details",
         "//executorch/extension/export_util:export_util",
-        "//executorch/extension/llm/tokenizer:tokenizer_py_lib",
+        "//pytorch/tokenizers/pytorch_tokenizers:tokenizers",
     ],
 )
@@ -35,7 +35,7 @@
 from executorch.extension.export_util.utils import export_to_edge, save_pte_program
 
 from executorch.extension.llm.export.export_passes import RemoveRedundantTransposes
-from executorch.extension.llm.tokenizer.utils import get_tokenizer
+from pytorch_tokenizers import get_tokenizer
 from torch.ao.quantization.quantize_pt2e import convert_pt2e, prepare_pt2e
 from torch.ao.quantization.quantizer import Quantizer
 from torch.ao.quantization.quantizer.composable_quantizer import ComposableQuantizer
Original file line number	Diff line number	Diff line change
`@@ -56,7 +56,7 @@ cmake_build_phi_3_mini() {`
`56`	`56`	`prepare_tokenizer() {`
`57`	`57`	`echo "Downloading and converting tokenizer.model"`
`58`	`58`	`wget -O tokenizer.model "https://huggingface.co/microsoft/Phi-3-mini-128k-instruct/resolve/main/tokenizer.model?download=true"`
`59`		`- $PYTHON_EXECUTABLE -m executorch.extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin`
	`59`	`+ $PYTHON_EXECUTABLE -m pytorch_tokenizers.tools.llama2c.convert -t tokenizer.model -o tokenizer.bin`
`60`	`60`	`}`
`61`	`61`
`62`	`62`	`# Export phi-3-mini model to pte`
Original file line number	Diff line number	Diff line change
`@@ -202,7 +202,7 @@ runtime.python_library(`
`202`	`202`	`":export_library",`
`203`	`203`	`"//executorch/examples/models/llama/tokenizer:tiktoken_py",`
`204`	`204`	`"//executorch/extension/llm/export:export_lib",`
`205`		`- "//executorch/extension/llm/tokenizer:tokenizer_py_lib",`
	`205`	`+ "//pytorch/tokenizers/pytorch_tokenizers:tokenizers",`
`206`	`206`	`"//executorch/extension/pybindings:portable_lib",`
`207`	`207`	`],`
`208`	`208`	`)`
Original file line number	Diff line number	Diff line change
`@@ -46,8 +46,8 @@`
`46`	`46`	`)`
`47`	`47`
`48`	`48`	`from executorch.extension.llm.export.builder import DType, LLMEdgeManager`
`49`		`-from executorch.extension.llm.tokenizer.tokenizer import Tokenizer`
`50`	`49`	`from executorch.util.activation_memory_profiler import generate_memory_trace`
	`50`	`+from pytorch_tokenizers.llama2c import Llama2cTokenizer as Tokenizer`
`51`	`51`	`from torch.export import Dim`
`52`	`52`	`from torch.nn.attention import SDPBackend`
`53`	`53`
Original file line number	Diff line number	Diff line change
`@@ -40,6 +40,6 @@ runtime.python_library(`
`40`	`40`	`"//executorch/exir:lib",`
`41`	`41`	`"//executorch/exir/backend:backend_details",`
`42`	`42`	`"//executorch/extension/export_util:export_util",`
`43`		`- "//executorch/extension/llm/tokenizer:tokenizer_py_lib",`
	`43`	`+ "//pytorch/tokenizers/pytorch_tokenizers:tokenizers",`
`44`	`44`	`],`
`45`	`45`	`)`