diff --git a/main/hugectr_contributor_guide.html b/main/hugectr_contributor_guide.html
index fea5d517cc..390475ce1d 100644
--- a/main/hugectr_contributor_guide.html
+++ b/main/hugectr_contributor_guide.html
@@ -196,10 +196,10 @@
$ mkdir -p build && cd build
$ cmake -DCMAKE_BUILD_TYPE=Release -DSM=80 .. # Target is NVIDIA A100
@@ -212,7 +212,7 @@ Build HugeCTR Training Container from Source
diff --git a/main/searchindex.js b/main/searchindex.js
index 3a1fdc6ec4..c40c67685d 100644
--- a/main/searchindex.js
+++ b/main/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"docnames": ["QAList", "additional_resources", "api/hugectr_layer_book", "api/index", "api/python_interface", "hierarchical_parameter_server/hps_database_backend", "hierarchical_parameter_server/hps_dlrm_benchmark", "hierarchical_parameter_server/hps_tf_api/index", "hierarchical_parameter_server/hps_tf_api/initialize", "hierarchical_parameter_server/hps_tf_api/layers", "hierarchical_parameter_server/hps_tf_user_guide", "hierarchical_parameter_server/hps_torch_api/index", "hierarchical_parameter_server/hps_torch_api/lookup_layer", "hierarchical_parameter_server/hps_torch_user_guide", "hierarchical_parameter_server/hps_trt_api/hps_plugin", "hierarchical_parameter_server/hps_trt_api/hps_plugin_creator", "hierarchical_parameter_server/hps_trt_api/index", "hierarchical_parameter_server/hps_trt_user_guide", "hierarchical_parameter_server/index", "hierarchical_parameter_server/profiling_hps", "hps_tf/notebooks/hierarchical_parameter_server_demo", "hps_tf/notebooks/hps_multi_table_sparse_input_demo", "hps_tf/notebooks/hps_pretrained_model_training_demo", "hps_tf/notebooks/hps_table_fusion_demo", "hps_tf/notebooks/hps_tensorflow_triton_deployment_demo", "hps_tf/notebooks/index", "hps_tf/notebooks/sok_to_hps_dlrm_demo", "hps_tf/notebooks/sok_train_demo", "hps_torch/notebooks/hps_torch_demo", "hps_torch/notebooks/index", "hps_trt/notebooks/benchmark_tf_trained_large_model", "hps_trt/notebooks/demo_for_hugectr_trained_model", "hps_trt/notebooks/demo_for_pytorch_trained_model", "hps_trt/notebooks/demo_for_tf_trained_model", "hps_trt/notebooks/index", "hugectr_contributor_guide", "hugectr_core_features", "hugectr_talks_blogs", "hugectr_user_guide", "index", "notebooks/embedding_collection", "notebooks/hps_demo", "notebooks/hugectr_e2e_demo_with_nvtabular", "notebooks/index", "notebooks/multi-modal-data/00-Intro", "notebooks/multi-modal-data/01-Download-Convert", "notebooks/multi-modal-data/02-Data-Enrichment", "notebooks/multi-modal-data/03-Feature-Extraction-Poster", "notebooks/multi-modal-data/04-Feature-Extraction-Text", "notebooks/multi-modal-data/05-Create-Feature-Store", "notebooks/multi-modal-data/06-ETL-with-NVTabular", "notebooks/multi-modal-data/07-Training-with-HugeCTR", "notebooks/multi-modal-data/index", "notebooks/training_with_remote_filesystem", "performance", "release_notes", "sparse_operation_kit"], "filenames": ["QAList.md", "additional_resources.md", "api/hugectr_layer_book.md", "api/index.rst", "api/python_interface.md", "hierarchical_parameter_server/hps_database_backend.md", "hierarchical_parameter_server/hps_dlrm_benchmark.md", "hierarchical_parameter_server/hps_tf_api/index.rst", "hierarchical_parameter_server/hps_tf_api/initialize.rst", "hierarchical_parameter_server/hps_tf_api/layers.rst", "hierarchical_parameter_server/hps_tf_user_guide.md", "hierarchical_parameter_server/hps_torch_api/index.rst", "hierarchical_parameter_server/hps_torch_api/lookup_layer.md", "hierarchical_parameter_server/hps_torch_user_guide.md", "hierarchical_parameter_server/hps_trt_api/hps_plugin.md", "hierarchical_parameter_server/hps_trt_api/hps_plugin_creator.md", "hierarchical_parameter_server/hps_trt_api/index.rst", "hierarchical_parameter_server/hps_trt_user_guide.md", "hierarchical_parameter_server/index.md", "hierarchical_parameter_server/profiling_hps.md", "hps_tf/notebooks/hierarchical_parameter_server_demo.ipynb", "hps_tf/notebooks/hps_multi_table_sparse_input_demo.ipynb", "hps_tf/notebooks/hps_pretrained_model_training_demo.ipynb", "hps_tf/notebooks/hps_table_fusion_demo.ipynb", "hps_tf/notebooks/hps_tensorflow_triton_deployment_demo.ipynb", "hps_tf/notebooks/index.md", "hps_tf/notebooks/sok_to_hps_dlrm_demo.ipynb", "hps_tf/notebooks/sok_train_demo.ipynb", "hps_torch/notebooks/hps_torch_demo.ipynb", "hps_torch/notebooks/index.md", "hps_trt/notebooks/benchmark_tf_trained_large_model.ipynb", "hps_trt/notebooks/demo_for_hugectr_trained_model.ipynb", "hps_trt/notebooks/demo_for_pytorch_trained_model.ipynb", "hps_trt/notebooks/demo_for_tf_trained_model.ipynb", "hps_trt/notebooks/index.md", "hugectr_contributor_guide.md", "hugectr_core_features.md", "hugectr_talks_blogs.md", "hugectr_user_guide.md", "index.rst", "notebooks/embedding_collection.ipynb", "notebooks/hps_demo.ipynb", "notebooks/hugectr_e2e_demo_with_nvtabular.ipynb", "notebooks/index.md", "notebooks/multi-modal-data/00-Intro.ipynb", "notebooks/multi-modal-data/01-Download-Convert.ipynb", "notebooks/multi-modal-data/02-Data-Enrichment.ipynb", "notebooks/multi-modal-data/03-Feature-Extraction-Poster.ipynb", "notebooks/multi-modal-data/04-Feature-Extraction-Text.ipynb", "notebooks/multi-modal-data/05-Create-Feature-Store.ipynb", "notebooks/multi-modal-data/06-ETL-with-NVTabular.ipynb", "notebooks/multi-modal-data/07-Training-with-HugeCTR.ipynb", "notebooks/multi-modal-data/index.md", "notebooks/training_with_remote_filesystem.ipynb", "performance.md", "release_notes.md", "sparse_operation_kit.md"], "titles": ["Questions and Answers", "Additional Resources", "HugeCTR Layer Classes and Methods", "HugeCTR API Documentation", "HugeCTR Python Interface", "Hierarchical Parameter Server Database Backend", "Benchmark the DLRM Model with HPS", "Hierarchical Parameter Server API", "HPS Initialize", "HPS Layers", "Hierarchical Parameter Server Plugin for TensorFlow", "HPS Plugin for Torch API", "HPS Plugin for Torch", "Hierarchical Parameter Server Plugin for Torch", "HPS Plugin", "HPS Plugin Creator", "HPS Plugin for TensorRT API", "Hierarchical Parameter Server Plugin for TensorRT", "Hierarchical Parameter Server", "Profiling HPS", "Hierarchical Parameter Server Demo", "HPS for Multiple Tables and Sparse Inputs", "HPS Pretrained Model Training Demo", "HPS Table Fusion Demo", "Deploy SavedModel using HPS with Triton TensorFlow Backend", "Hierarchical Parameter Server Notebooks", "SOK to HPS DLRM Demo", "SOK Train DLRM Demo", "HPS Torch Demo", "Hierarchical Parameter Server Notebooks", "HPS TensorRT Plugin Benchmark for TensorFlow Large Model", "HPS TensorRT Plugin Demo for HugeCTR Trained Model", "HPS TensorRT Plugin Demo for PyTorch Trained Model", "HPS TensorRT Plugin Demo for TensorFlow Trained Model", "HPS Plugin for TensorRT Notebooks", "Contributing to HugeCTR", "HugeCTR Core Features", "HugeCTR Talks and Blogs", "Introduction to HugeCTR", "Merlin HugeCTR", "HugeCTR Embedding Collection", "Hierarchical Parameter Server Demo", "HugeCTR End-end Example with NVTabular", "HugeCTR Example Notebooks", "Training Recommender Systems on Multi-modal Data", "MovieLens-25M: Download and Convert", "MovieLens Data Enrichment", "Movie Poster Feature Extraction with ResNet", "Movie Synopsis Feature Extraction with Bart text summarization", "Creating Multi-Modal Movie Feature Store", "ETL with NVTabular", "Training HugeCTR Model with Pre-trained Embeddings", "Multi-modal Example Notebooks", "HugeCTR Training with Remote File System Example", "Performance", "Release Notes", "Sparse Operation Kit"], "terms": {"try": [0, 5, 31, 36, 41, 46, 47, 55], "provid": [0, 2, 4, 5, 10, 13, 17, 18, 20, 21, 22, 25, 26, 28, 29, 30, 31, 34, 35, 36, 38, 39, 40, 41, 43, 44, 50, 52, 53, 54, 55, 56], "recommend": [0, 2, 4, 5, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 37, 38, 39, 43, 45, 50, 52, 55], "variou": [0, 5, 13, 36, 38], "industri": [0, 36], "high": [0, 3, 5, 10, 13, 17, 18, 20, 21, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 46, 50, 54, 55], "effici": [0, 4, 5, 13, 22, 30, 54, 55], "solut": [0, 18, 36, 38, 55], "onlin": [0, 4, 5, 8, 10, 30, 36, 55], "offlin": [0, 4, 5, 43, 55], "also": [0, 2, 4, 5, 6, 14, 19, 20, 21, 22, 24, 25, 26, 30, 36, 38, 40, 41, 43, 44, 46, 50, 51, 55], "refer": [0, 2, 4, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 44, 53, 55], "design": [0, 2, 4, 5, 13, 35, 36, 37, 38, 39, 50, 55, 56], "develop": [0, 5, 25, 29, 34, 36, 37, 39, 40, 43, 55], "want": [0, 2, 4, 5, 9, 30, 34, 35, 36, 45, 50, 53, 55], "port": [0, 4, 5, 25, 29, 30, 34, 41, 42, 43, 53, 55], "optim": [0, 2, 4, 19, 20, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 33, 37, 40, 41, 42, 51, 53, 54, 55], "current": [0, 2, 4, 8, 20, 21, 22, 26, 30, 32, 33, 38, 41, 45, 46, 47, 50, 53, 55], "v2": [0, 2, 4, 24, 47, 55], "dnn": [0, 20, 21, 22, 23, 24, 36, 54, 55, 56], "wdl": [0, 5, 19, 38, 41, 54], "dcn": [0, 2, 4, 36, 38, 54, 55], "deepfm": [0, 38, 55], "dlrm": [0, 10, 17, 25, 30, 31, 32, 33, 38, 54, 55], "variant": [0, 30, 38, 55], "wide": [0, 38, 54, 55], "system": [0, 2, 4, 5, 10, 13, 17, 18, 20, 21, 22, 23, 24, 27, 28, 31, 32, 33, 35, 36, 37, 38, 41, 45, 50, 51, 52, 54, 55], "directori": [0, 4, 5, 10, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 47, 50, 54, 55], "repositori": [0, 4, 10, 18, 19, 24, 31, 32, 33, 35, 36, 38, 39, 40, 41, 53, 54, 55], "github": [0, 4, 19, 23, 25, 28, 29, 30, 33, 34, 35, 36, 38, 39, 40, 41, 43, 47, 50, 53, 54, 55], "them": [0, 2, 4, 9, 13, 20, 21, 22, 23, 24, 26, 30, 35, 50, 55], "express": [0, 2, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "confin": 0, "aforement": [0, 2], "you": [0, 2, 4, 5, 8, 9, 10, 13, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 49, 50, 53, 55, 56], "your": [0, 2, 4, 5, 10, 13, 17, 19, 22, 25, 29, 30, 31, 32, 33, 34, 36, 38, 41, 43, 53, 55], "own": [0, 2, 25, 29, 34, 38], "combin": [0, 2, 4, 5, 9, 10, 13, 17, 20, 21, 22, 26, 27, 28, 31, 32, 33, 35, 36, 40, 41, 42, 44, 51, 53, 55], "ha": [0, 2, 4, 5, 6, 9, 12, 14, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 38, 41, 50, 54, 55], "tf": [0, 6, 8, 9, 10, 25, 26, 27, 35, 41, 54, 55], "yet": [0, 4, 20, 21, 24, 26, 30, 55], "compat": [0, 2, 5, 10, 20, 21, 22, 24, 30, 33, 36, 41, 42, 55, 56], "export": [0, 5, 30, 32, 40, 55], "follow": [0, 2, 4, 5, 6, 8, 10, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 47, 50, 53, 54, 55], "instruct": [0, 19, 20, 21, 22, 23, 24, 26, 30, 33, 35, 40, 41, 42, 53, 55], "dump_to_tf": [0, 55], "tutori": [0, 55], "ye": [0, 5, 19, 41], "check": [0, 2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 53, 55, 56], "out": [0, 2, 4, 5, 22, 24, 30, 32, 33, 36, 41, 43, 50, 55], "dcn2node": 0, "more": [0, 2, 4, 5, 10, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 38, 39, 40, 41, 43, 50, 54, 55], "detail": [0, 3, 4, 6, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 43, 55, 56], "across": [0, 2, 4, 5, 10, 36, 38, 39, 41, 50, 55], "so": [0, 2, 4, 5, 10, 13, 17, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 40, 41, 45, 50, 55], "have": [0, 2, 4, 5, 9, 10, 18, 20, 21, 24, 26, 30, 35, 36, 40, 41, 42, 49, 50, 53, 54, 55], "veri": [0, 36, 40, 55], "larg": [0, 2, 5, 6, 10, 13, 17, 18, 34, 36, 37, 38, 40, 41, 46, 48, 50, 55, 56], "just": [0, 30, 42, 47, 55], "mani": [0, 5, 30, 55, 56], "That": [0, 36, 55], "why": [0, 36], "name": [0, 2, 4, 5, 9, 12, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 38, 40, 41, 42, 43, 46, 47, 50, 51, 53, 55], "suppos": [0, 2, 41], "1tb": [0, 30, 36, 38, 54, 55], "16xv100": 0, "32gb": [0, 20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 53], "take": [0, 4, 5, 6, 19, 30, 31, 32, 33, 38, 41, 45, 46, 50, 55, 56], "case": [0, 2, 4, 5, 6, 30, 32, 36, 41, 53, 54, 55, 56], "comput": [0, 2, 4, 5, 6, 9, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 40, 41, 50, 55], "0": [0, 2, 4, 5, 6, 8, 9, 10, 13, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 54], "v100": [0, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 35, 38, 40, 41, 42, 43, 51, 53, 54, 55], "t4": [0, 10, 13, 17, 38], "A": [0, 2, 4, 5, 9, 19, 25, 29, 30, 34, 36, 37, 38, 40, 41, 43, 50, 55], "machin": [0, 2, 4, 5, 6, 25, 29, 34, 37, 41, 42, 43, 54, 55, 56], "mandatori": 0, "achiev": [0, 2, 4, 5, 6, 13, 28, 30, 36, 41, 54, 55], "best": [0, 2, 4, 5, 6, 22, 28, 36], "perform": [0, 2, 4, 5, 6, 9, 10, 12, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 33, 34, 35, 36, 37, 41, 55], "exploit": [0, 10], "nvswitch": [0, 2], "inter": [0, 36, 41, 54, 55], "bandwidth": [0, 2, 4, 5, 36, 55], "ucx": [0, 42], "howev": [0, 2, 5, 10, 17, 30, 35, 38, 41, 43, 49, 50, 55], "rdma": [0, 4, 36, 55], "maxim": [0, 5, 30], "transact": [0, 36, 54, 55], "approach": [0, 30, 41], "offload": [0, 5, 55], "workload": [0, 4, 55, 56], "oper": [0, 2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 30, 33, 37, 40, 41, 43, 50, 55], "mainli": 0, "decid": [0, 2, 4], "kind": [0, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 53, 55], "o": [0, 2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 45, 46, 50, 51, 55], "devic": [0, 4, 5, 8, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 47, 50, 51, 53, 54, 55], "dataset": [0, 2, 3, 5, 9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 40, 41, 42, 43, 44, 46, 50, 52, 53, 54, 55], "section": [0, 4, 5, 30, 33, 35, 40, 45, 46, 49, 51, 55], "api": [0, 2, 8, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 36, 37, 41, 43, 46, 47, 50, 53, 55], "document": [0, 2, 4, 5, 15, 18, 19, 26, 27, 30, 33, 35, 36, 39, 41, 43, 55, 56], "introduc": [0, 2, 4, 37, 43, 55], "our": [0, 4, 5, 6, 10, 17, 25, 29, 30, 34, 35, 36, 38, 39, 43, 45, 51, 53, 54, 55], "first": [0, 2, 4, 5, 8, 10, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 45, 46, 47, 48, 50, 51, 55], "version": [0, 2, 4, 5, 6, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 49, 50, 51, 53, 54], "exampl": [0, 2, 4, 5, 8, 9, 15, 19, 25, 29, 30, 34, 35, 36, 38, 40, 41, 44, 50, 54, 55], "hashtabl": [0, 26, 27], "base": [0, 2, 4, 5, 9, 17, 19, 24, 25, 30, 31, 32, 33, 34, 36, 38, 41, 45, 50, 52, 55], "dynam": [0, 2, 4, 5, 23, 33, 38, 41, 55], "insert": [0, 2, 5, 6, 19, 28, 30, 31, 32, 33, 38, 41, 55], "new": [0, 4, 5, 22, 24, 25, 38, 41, 42, 46, 50], "ad": [0, 2, 4, 41, 50, 54, 55], "runtim": [0, 5, 8, 10, 13, 17, 25, 29, 34, 38, 41, 42, 43, 55], "skip": [0, 31, 40, 41, 49, 55], "In": [0, 2, 4, 5, 6, 8, 9, 20, 21, 22, 24, 26, 30, 31, 32, 33, 35, 36, 40, 41, 42, 45, 46, 47, 48, 50, 51, 53, 54, 55, 56], "field": [0, 2, 4, 5, 6, 15, 20, 21, 22, 24, 26, 27, 32, 33, 36, 41, 44, 50], "The": [0, 2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 50, 51, 52, 53, 54, 55], "one": [0, 2, 4, 5, 6, 8, 9, 14, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 41, 43, 54, 55], "hot": [0, 2, 4, 10, 19, 21, 24, 27, 31, 36, 41, 45, 50, 55], "number": [0, 2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 40, 41, 42, 44, 45, 51, 53, 54, 55], "specifi": [0, 2, 4, 5, 8, 9, 10, 12, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 42, 43, 53, 55], "slot_num": [0, 2, 4, 5, 20, 21, 22, 24, 26, 27, 30, 32, 33, 51], "There": [0, 2, 4, 10, 19, 30, 31, 32, 33, 38, 43, 55], "sub": [0, 3, 41, 55], "class": [0, 3, 9, 11, 14, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 40, 46, 50, 55], "thei": [0, 4, 5, 20, 21, 22, 24, 26, 27, 45, 47, 55, 56], "distinguish": [0, 55], "method": [0, 3, 6, 33, 40, 41, 42, 53, 55], "distribut": [0, 2, 4, 5, 8, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 36, 37, 38, 39, 40, 41, 42, 53, 55, 56], "call": [0, 2, 4, 8, 9, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 41, 44, 50, 55], "local": [0, 4, 5, 17, 18, 19, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 42, 43, 49, 53, 55], "mai": [0, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 33, 35, 36, 37, 40, 42, 50, 53, 55], "accord": [0, 2, 4, 5, 24, 30, 31, 32, 33, 36, 55], "index": [0, 2, 4, 9, 12, 15, 24, 26, 27, 30, 31, 32, 33, 36, 42, 49, 51, 53, 55], "regardless": [0, 36, 56], "mean": [0, 2, 4, 5, 9, 19, 21, 22, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 40, 41, 43, 47, 48, 50, 55], "thu": [0, 2, 22, 24, 26, 40, 55], "smaller": [0, 5, 36, 55], "than": [0, 2, 4, 5, 9, 19, 24, 30, 36, 43, 50, 54, 55], "reduct": [0, 2, 9, 22, 36, 38], "per": [0, 2, 4, 5, 6, 31, 34, 41, 45, 55], "global": [0, 4, 5, 8, 9, 20, 21, 22, 24, 26, 27, 31, 32, 33, 36, 40, 41, 42, 50, 51, 53, 55], "reduc": [0, 2, 4, 5, 22, 30, 31, 32, 33, 36, 40, 41, 42, 51, 53, 55], "overal": [0, 5, 36], "much": [0, 36, 55], "less": [0, 4, 30, 36, 55], "made": [0, 2, 55], "some": [0, 2, 4, 5, 23, 24, 30, 35, 41, 43, 46, 48, 55], "larger": [0, 4, 5, 9, 36, 55], "trasact": 0, "iter": [0, 2, 4, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "after": [0, 2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 42, 53], "forward": [0, 2, 4, 5, 6, 9, 12, 17, 28, 30, 32, 38, 41, 55], "kernel": [0, 4, 24, 30, 31, 32, 33, 46, 47, 48, 55], "function": [0, 2, 4, 5, 8, 9, 12, 19, 20, 21, 22, 24, 26, 27, 31, 32, 33, 35, 38, 41, 50, 55, 56], "collect": [0, 3, 4, 10, 13, 17, 19, 30, 38, 50, 55], "commun": [0, 2, 4, 5, 36, 55], "librari": [0, 4, 10, 13, 17, 18, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 39, 41, 48, 50, 55], "nccl": [0, 4, 22, 31, 36, 40, 41, 42, 51, 53, 55], "should": [0, 2, 4, 5, 8, 9, 10, 14, 20, 21, 22, 24, 28, 30, 31, 32, 33, 35, 36, 41, 47, 48, 49, 50, 55], "sourc": [0, 3, 8, 9, 10, 13, 17, 19, 31, 36, 38, 39, 40, 41, 42, 43, 51, 53, 55], "where": [0, 2, 5, 9, 17, 36, 40, 41, 44, 46, 55], "spars": [0, 3, 4, 5, 9, 19, 22, 24, 25, 26, 27, 30, 31, 37, 38, 40, 41, 42, 43, 51, 53, 55], "an": [0, 2, 4, 5, 8, 9, 15, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 35, 36, 37, 38, 39, 41, 42, 43, 46, 47, 50, 53, 55], "arrai": [0, 2, 4, 15, 20, 21, 22, 24, 26, 28, 31, 32, 33, 41, 42, 47, 51, 55], "belong": [0, 4], "last": [0, 2, 4, 5, 9, 20, 21, 22, 26, 33, 41, 47, 48], "second": [0, 2, 4, 5, 21, 23, 28, 30, 33, 55], "element": [0, 2, 4, 51, 55], "below": [0, 2, 4, 6, 15, 19, 25, 29, 30, 34, 35, 43, 48, 49, 51], "top": [0, 2, 4, 26, 27, 32, 33, 54, 55], "data1": [0, 2, 4, 40, 41, 51, 53], "type": [0, 3, 4, 5, 8, 9, 10, 14, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 36, 38, 40, 41, 42, 44, 50, 51, 53, 55], "distributedslot": 0, "max_feature_num_per_sampl": 0, "data2": [0, 40, 41], "binari": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 26, 30, 33, 41, 50, 51, 55], "raw": [0, 2, 3, 23, 24, 28, 30, 31, 32, 33, 38, 41, 44, 50, 51, 55], "snapshot": [0, 4, 31, 40, 41, 42, 51, 53], "json": [0, 2, 4, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 41, 42, 47, 50, 51, 53, 55], "interv": [0, 4, 5, 31, 40, 41, 42, 51, 53], "checkpoint": [0, 30, 47], "prefix": [0, 4, 5, 41], "snapshot_prefix": [0, 2, 4, 31, 40, 41, 42, 53], "modifi": [0, 4, 17, 30, 33, 41, 55], "dense_model_fil": [0, 4, 5, 41], "sparse_model_fil": [0, 4, 5, 41], "solver": [0, 2, 3, 31, 40, 41, 42, 51, 53, 55], "write": [0, 4, 5, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "script": [0, 4, 6, 28, 30, 36, 38, 41, 43, 47, 53, 54, 55], "demonstr": [0, 4, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 41, 43, 44, 52, 55], "uniqu": [0, 2, 4, 5, 51, 55], "preprocess": [0, 4, 30, 40, 43, 54, 55], "e": [0, 4, 5, 6, 9, 10, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 36, 41, 46, 47], "g": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 41, 53], "offset": [0, 2, 4, 27, 55], "hash": [0, 2, 5, 31, 38, 41, 42, 51, 53, 55], "nnz": [0, 4, 21, 22, 26, 31, 41], "look": [0, 4, 5, 9, 19, 30, 41, 45, 49, 50, 55], "up": [0, 2, 4, 5, 9, 21, 24, 25, 28, 29, 30, 31, 33, 34, 36, 40, 41, 42, 50, 51, 53, 54, 55], "firstli": [0, 53], "guid": [0, 4, 22, 24, 30, 31, 32, 33, 38, 55], "secondli": [0, 53], "data_gener": [0, 4, 31, 38, 41, 55], "gener": [0, 2, 3, 5, 6, 14, 19, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 35, 50, 54, 55], "random": [0, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 45, 49, 55], "see": [0, 2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 39, 40, 41, 42, 43, 45, 50, 53, 54, 55], "start": [0, 2, 4, 5, 10, 13, 17, 19, 23, 24, 26, 28, 30, 31, 32, 33, 36, 38, 40, 41, 42, 46, 47, 51, 53, 55], "readm": [0, 40, 41, 55], "thirdli": 0, "huge_ctr": 0, "your_config": 0, "alloc": [0, 4, 5, 26, 30, 31, 32, 33, 40, 41, 42, 55], "accordingli": [0, 33, 55], "necessarili": 0, "exact": [0, 2], "depend": [0, 2, 4, 5, 10, 13, 17, 23, 28, 31, 35, 38, 40, 41, 42, 45, 50, 51, 53, 55], "vocabulari": [0, 2, 21, 31, 40, 42, 51, 53, 55], "workspac": [0, 2, 19, 30, 47, 48, 55], "calcul": [0, 2, 4, 5, 42, 50, 55], "tool": [0, 4, 17, 19, 30, 31, 32, 33, 40, 41, 54, 55], "workspace_s": 0, "usual": [0, 2, 53], "real": [0, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 45, 55], "becaus": [0, 2, 5, 6, 19, 26, 27, 30, 41, 50, 54, 55, 56], "non": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 26, 30, 31, 33, 35, 40, 41, 42, 43, 53, 55], "uniform": [0, 2, 4, 27, 38], "kei": [0, 2, 4, 5, 9, 10, 12, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 36, 38, 40, 41, 46, 47, 51, 53, 55], "argument": [0, 2, 4, 8, 12, 19, 20, 21, 22, 23, 24, 26, 27, 32, 33, 35, 40, 41, 43, 50, 55], "usag": [0, 3, 4, 5, 10, 19, 30, 31, 32, 33, 40, 42, 55], "replac": [0, 5, 6, 17, 20, 21, 22, 24, 26, 30, 31, 32, 33, 55], "avoid": [0, 2, 4, 5, 20, 21, 22, 26, 30, 33, 36, 41, 55], "wast": [0, 2], "caus": [0, 2, 4, 5, 32, 55], "imbalanc": [0, 2], "add": [0, 3, 10, 13, 15, 17, 19, 21, 25, 29, 30, 31, 34, 35, 38, 40, 41, 42, 43, 50, 51, 53, 55], "maximum": [0, 2, 4, 5, 6, 28, 30, 51, 55], "equat": [0, 4], "_size": [0, 4], "_arrai": [0, 4], "k": [0, 2, 4, 47], "max": [0, 4, 5, 19, 21, 22, 23, 26, 28, 30, 31, 32, 33, 41], "limits_i": [0, 4], "k_i": [0, 4], "list": [0, 2, 3, 5, 6, 9, 20, 21, 24, 26, 27, 28, 30, 32, 33, 40, 41, 42, 45, 46, 47, 50, 51, 55], "inform": [0, 2, 4, 5, 10, 19, 23, 24, 28, 35, 36, 38, 39, 40, 41, 46, 50, 53, 54, 55], "about": [0, 3, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 39, 41, 50, 55], "relat": [0, 2, 4, 5, 24, 35, 53, 55], "amount": [0, 5, 40, 55, 56], "localizedslotsparseembeddinghash": [0, 3, 51, 55], "If": [0, 2, 4, 5, 9, 19, 25, 29, 30, 31, 32, 33, 34, 35, 36, 40, 41, 43, 45, 46, 49, 55], "help": [0, 2, 4, 5, 10, 19, 36, 40, 42, 53, 55], "altern": [0, 4, 5, 30, 43, 55], "both": [0, 2, 4, 5, 6, 26, 27, 35, 36, 41, 49, 50, 53, 54, 55], "localizedslotsparseembeddingonehot": [0, 3, 4], "hybridsparseembed": [0, 4], "workspace_size_per_gpu_in_md": 0, "while": [0, 2, 4, 5, 6, 13, 18, 20, 21, 24, 26, 27, 30, 31, 32, 33, 41, 46, 50, 54, 55, 56], "highli": [0, 2, 55], "reli": [0, 4, 5, 19, 35, 41, 55], "pcie": [0, 34], "connect": [0, 2, 4, 5, 21, 22, 23, 24, 25, 26, 29, 30, 33, 34, 38, 41, 42, 43, 55], "insid": [0, 4, 22, 30, 55], "expect": [0, 50, 55], "150gb": 0, "direct": [0, 50], "It": [0, 2, 4, 5, 8, 10, 12, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 36, 38, 40, 41, 43, 50, 55, 56], "3x": [0, 55], "pci": [0, 20, 21, 22, 23, 24, 26, 33, 41], "convert": [0, 6, 10, 17, 20, 21, 22, 24, 38, 44, 51, 52, 54, 55], "facilit": [0, 10, 30, 55], "process": [0, 2, 4, 5, 8, 24, 30, 31, 32, 33, 36, 40, 42, 45, 46, 49, 54, 55, 56], "save_params_to_fil": [0, 3], "familiar": [0, 4], "pre": [0, 5, 10, 25, 52, 53, 55], "hugectr_criteo": 0, "ipynb": [0, 6, 21, 22, 23, 24, 25, 26, 27, 29, 34, 36, 43, 44, 45, 46, 55], "inher": [0, 38], "extra": [0, 4, 46, 47, 48, 55], "abstract": [0, 2, 4, 50, 55], "awai": [0, 2, 50, 55], "slice": [0, 3, 33, 53, 55], "code": [0, 2, 8, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 50, 53, 55, 56], "cooper": 0, "thread": [0, 4, 5, 8, 20, 21, 22, 23, 24, 26, 31, 32, 33, 35, 38, 41, 42, 46, 54, 55], "cta": 0, "launch": [0, 5, 6, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 41, 43, 55], "foremost": 0, "exce": [0, 2, 5, 18, 55], "block": [0, 8, 30, 31, 32, 33, 41, 46, 55], "would": [0, 5, 32, 55], "better": [0, 2, 4, 5, 30, 42, 55], "warp": [0, 55], "sake": [0, 41], "occup": [0, 19], "still": [0, 4, 5, 24, 55], "freeli": 0, "architectur": [0, 10, 13, 17, 18, 20, 28, 36, 38, 47, 50, 55], "long": [0, 4, 5, 10, 32, 41, 55], "compli": 0, "limit": [0, 3, 5, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 53, 55, 56], "share": [0, 2, 5, 17, 30, 35, 41, 53, 55], "rank": [0, 2, 5, 9, 55], "ipc": [0, 19, 43, 47, 48, 55], "pin": [0, 55], "page": [0, 30, 37, 41, 55], "lock": [0, 55], "resourc": [0, 4, 5, 10, 26, 50, 55, 56], "issu": [0, 2, 5, 30, 33, 35], "option": [0, 2, 4, 5, 6, 19, 22, 24, 30, 33, 35, 36, 38, 41, 42, 46, 53, 55], "docker": [0, 5, 10, 13, 17, 19, 34, 35, 38, 41, 47, 48, 53, 55], "command": [0, 6, 10, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 38, 41, 43, 49, 53, 55], "host": [0, 4, 5, 10, 13, 17, 18, 19, 25, 29, 31, 32, 33, 34, 38, 41, 42, 43, 47, 48, 54, 55], "ulimit": [0, 19, 43, 55], "memlock": [0, 19, 43, 55], "stack": [0, 19, 28, 43, 47], "67108864": [0, 19, 43], "leverag": [0, 4, 6, 8, 10, 13, 17, 22, 24, 25, 30, 36, 50, 55], "hirarch": 0, "paramet": [0, 2, 4, 8, 9, 15, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 37, 43, 53, 55, 56], "cach": [0, 4, 6, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 36, 37, 41, 47, 55], "hierarch": [0, 2, 4, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 37, 43, 55], "storag": [0, 4, 5, 10, 13, 17, 18, 20, 28, 30, 31, 32, 33, 36, 40, 41, 42, 55], "encompass": [0, 10, 17], "databas": [0, 4, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 36, 41, 46, 55], "backend": [0, 4, 6, 10, 13, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 35, 36, 41, 47, 53, 55], "updat": [0, 4, 19, 22, 24, 27, 32, 35, 41, 43, 50, 53, 55], "manag": [0, 5, 10, 26, 30, 31, 32, 33, 41, 46, 55], "exhaust": [0, 5, 55], "constantli": [0, 10], "trigger": [0, 5, 8, 22, 33, 36, 55], "thi": [0, 2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56], "messag": [0, 5, 19, 33, 35, 41, 42, 55], "scenario": [0, 36, 55, 56], "either": [0, 4, 5, 9, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 53], "enforc": [0, 50], "mode": [0, 2, 4, 5, 6, 10, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 51, 53, 55], "hit_rate_threshold": [0, 4, 5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "extend": [0, 2, 5, 10, 21, 22, 26, 27, 55], "enough": [0, 2, 55], "number_of_worker_buffers_in_pool": [0, 4, 5], "pleas": [0, 2, 4, 5, 6, 10, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 46, 53, 55, 56], "hp": [0, 4, 18, 25, 27, 29, 36, 43, 55], "talk": [1, 55], "blog": [1, 54, 55], "question": [1, 35], "answer": 1, "contribut": [1, 55], "hugectr": [1, 5, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 44, 50, 52, 55], "differ": [2, 4, 5, 10, 17, 18, 19, 22, 23, 28, 31, 33, 34, 35, 36, 40, 41, 45, 55], "correspond": [2, 4, 5, 9, 36, 41, 50, 55], "python": [2, 3, 5, 10, 13, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 37, 38, 41, 42, 43, 49, 51, 53, 55, 56], "descript": [2, 15, 40, 42, 44, 55], "each": [2, 4, 5, 8, 9, 10, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 34, 36, 38, 40, 41, 42, 43, 50, 51, 53, 54, 55], "includ": [2, 4, 5, 10, 17, 18, 19, 36, 38, 41, 44, 45, 46, 55], "its": [2, 4, 5, 6, 9, 20, 21, 22, 24, 25, 29, 30, 33, 34, 36, 38, 43, 46, 55], "data": [2, 3, 5, 6, 9, 14, 19, 20, 21, 22, 24, 26, 27, 32, 33, 35, 36, 43, 45, 47, 50, 51, 52, 54, 55, 56], "model": [2, 3, 8, 9, 10, 12, 13, 15, 17, 18, 19, 23, 24, 25, 28, 34, 35, 37, 38, 41, 43, 44, 47, 50, 52, 54, 55, 56], "instanc": [2, 4, 5, 6, 9, 30, 33, 36, 46, 47, 48, 55, 56], "sparseembed": [2, 4, 31, 41, 42, 51, 53, 55], "denselay": [2, 4, 31, 40, 41, 42, 51, 53, 55], "can": [2, 4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 43, 44, 45, 46, 50, 53, 54, 55, 56], "access": [2, 5, 10, 13, 17, 18, 25, 29, 30, 31, 34, 40, 41, 42, 43, 51, 53, 55], "label_dim": [2, 4, 5, 31, 40, 41, 42, 51, 53, 55], "integ": [2, 4, 5, 12, 38, 50, 54], "label": [2, 4, 9, 20, 21, 22, 24, 26, 27, 31, 32, 33, 35, 38, 40, 41, 42, 50, 51, 53, 54, 55], "dimens": [2, 4, 9, 20, 21, 22, 24, 26, 27, 32, 33, 55], "1": [2, 4, 5, 6, 8, 9, 10, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53], "impli": [2, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "i": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56], "For": [2, 4, 5, 6, 9, 10, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 50, 54, 55], "item": [2, 4, 44, 46, 47, 48, 53, 54, 55], "click": [2, 36, 37, 38, 39, 54, 55], "NO": [2, 4, 19, 41], "default": [2, 4, 5, 9, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 38, 40, 41, 43, 54, 55], "valu": [2, 4, 5, 8, 9, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 40, 41, 47, 48, 49, 51, 55], "user": [2, 4, 5, 10, 13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 38, 40, 42, 44, 45, 50, 51, 53, 54, 55], "label_nam": [2, 4, 31, 40, 41, 42, 51, 53], "string": [2, 4, 5, 8, 9, 12, 15, 31, 41, 45, 50, 55], "tensor": [2, 4, 9, 12, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53, 55], "referenc": [2, 10, 38], "dense_dim": [2, 4, 22, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "continu": [2, 4, 5, 30, 43, 46, 50, 55], "featur": [2, 4, 5, 9, 20, 21, 22, 24, 25, 26, 27, 30, 31, 32, 33, 35, 38, 40, 41, 42, 44, 45, 46, 50, 52, 53, 54, 55], "set": [2, 4, 5, 8, 17, 20, 21, 23, 25, 26, 29, 30, 33, 34, 36, 38, 40, 41, 43, 46, 47, 50, 53, 54, 55], "dense_nam": [2, 4, 31, 40, 41, 42, 51, 53], "data_reader_sparse_param_arrai": [2, 4, 31, 40, 41, 42, 51, 53], "datareadersparseparam": [2, 4, 31, 40, 41, 42, 51, 53], "categor": [2, 4, 30, 38, 44, 45, 50, 51, 54, 55], "construct": [2, 4, 41, 50, 55], "sparse_nam": 2, "nnz_per_slot": [2, 51, 55], "is_fixed_length": [2, 51, 55], "reader": [2, 4, 31, 35, 38, 40, 41, 42, 51, 53, 55], "int": [2, 4, 5, 8, 9, 27, 28, 30, 31, 32, 33, 41, 42, 51, 55], "which": [2, 4, 5, 6, 8, 9, 12, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 43, 50, 54, 55, 56], "appli": [2, 4, 5, 13, 19, 20, 24, 25, 28, 30, 35, 36, 40, 50, 54, 55], "everi": [2, 4, 32, 55], "slot": [2, 4, 5, 21, 22, 26, 36, 38, 41, 42, 55], "could": [2, 5, 22, 24, 30, 33, 41, 55], "conveni": [2, 10, 13, 17, 19, 25, 29, 34, 38, 43, 55], "all": [2, 4, 5, 6, 8, 9, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 50, 51, 53, 54, 55, 56], "same": [2, 4, 5, 6, 9, 12, 17, 20, 21, 23, 24, 25, 26, 28, 30, 32, 33, 36, 50, 54, 55], "Or": 2, "initi": [2, 4, 5, 7, 9, 12, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 36, 38, 41, 42, 43, 50, 55], "when": [2, 4, 5, 8, 10, 14, 15, 17, 21, 22, 24, 25, 27, 28, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 43, 50, 53, 55], "length": [2, 4, 5, 24, 27, 41], "ident": [2, 5, 24, 30, 33, 55], "note": [2, 4, 5, 9, 19, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 36, 40, 41, 43, 46, 47, 48, 51, 53], "rawasync": [2, 4, 55], "onli": [2, 4, 5, 8, 10, 20, 22, 24, 30, 31, 32, 33, 35, 36, 38, 40, 41, 50, 51, 54, 55, 56], "static": [2, 4, 5, 19, 28, 30, 31, 32, 41, 55], "support": [2, 4, 5, 9, 10, 13, 15, 17, 19, 20, 21, 22, 24, 26, 28, 30, 31, 32, 33, 35, 38, 40, 41, 48, 50, 51, 53, 55, 56], "impact": [2, 55], "parquet": [2, 3, 31, 38, 40, 41, 42, 45, 49, 50, 51, 53, 55], "identifi": [2, 38, 47, 55], "whether": [2, 4, 5, 41, 56], "among": [2, 4, 36, 56], "sampl": [2, 4, 5, 6, 10, 13, 17, 28, 30, 31, 35, 36, 38, 40, 41, 42, 55], "true": [2, 4, 5, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 42, 46, 47, 48, 51, 53, 55], "transfer": [2, 10, 41, 55], "time": [2, 5, 8, 17, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 44, 45, 46, 50, 51, 53, 54, 55], "13": [2, 4, 6, 21, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53, 54, 55], "26": [2, 4, 5, 6, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 47, 51, 53, 54], "wide_data": [2, 4, 42], "2": [2, 4, 5, 6, 8, 9, 10, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 40, 42, 45, 47, 49, 50, 51, 53], "deep_data": [2, 4, 42], "One": 2, "sever": [2, 4, 5, 10, 19, 20, 21, 22, 23, 24, 30, 36, 40, 44, 52, 55], "befor": [2, 4, 5, 8, 9, 10, 21, 22, 23, 24, 26, 27, 35, 38, 40, 41, 42, 43, 47, 53, 55], "embedding_typ": [2, 4, 31, 41, 42, 51, 53], "embedding_t": [2, 4, 28, 31, 41, 42, 51, 53], "doe": [2, 4, 5, 19, 22, 25, 26, 29, 30, 31, 32, 33, 34, 43, 55], "must": [2, 4, 5, 8, 9, 14, 17, 27, 30, 33, 36, 55], "workspace_size_per_gpu_in_mb": [2, 4, 31, 41, 42, 51, 53, 55], "memori": [2, 4, 5, 10, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 36, 40, 41, 42, 43, 50, 55, 56], "size": [2, 4, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 36, 40, 41, 42, 46, 50, 51, 53, 54, 55], "megabyt": 2, "gpu": [2, 4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 48, 50, 51, 53, 54, 55, 56], "big": 2, "hold": [2, 5], "state": [2, 4, 5, 24, 31, 35, 36, 41, 42, 48, 50, 51, 53, 55], "dure": [2, 4, 5, 20, 21, 24, 26, 27, 30, 36, 38, 55], "train": [2, 3, 10, 17, 18, 19, 23, 25, 34, 37, 38, 39, 43, 47, 50, 52, 54, 55, 56], "evalu": [2, 3, 5, 8, 20, 21, 24, 26, 31, 40, 41, 42, 50, 51, 53, 55], "To": [2, 4, 5, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 33, 34, 35, 36, 38, 40, 41, 42, 43, 53, 55], "understand": [2, 55], "how": [2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 40, 41, 43, 50, 52, 55], "slot_size_arrai": [2, 4, 31, 40, 41, 42, 51, 53, 55], "embedding_vec_s": [2, 4, 20, 21, 22, 23, 24, 26, 28, 31, 32, 33, 41, 42, 51, 53], "vector": [2, 4, 5, 9, 10, 12, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 38, 55], "intra": [2, 36, 54], "sum": [2, 4, 9, 21, 40, 41, 42, 51, 53, 55], "sparse_embedding_nam": [2, 4, 31, 41, 42, 51, 53], "bottom_nam": [2, 4, 31, 40, 41, 42, 51, 53], "bottom": [2, 26, 27, 32, 33, 55], "consum": [2, 5, 55, 56], "predefin": 2, "from": [2, 4, 5, 9, 10, 13, 14, 17, 18, 19, 25, 29, 31, 32, 33, 36, 40, 42, 43, 44, 45, 48, 49, 50, 51, 53, 54, 55], "consist": [2, 4, 5, 10, 13, 15, 17, 24, 30, 38, 40, 41, 50, 55], "optparamspi": [2, 3], "dedic": [2, 10, 17, 36, 37, 38, 55, 56], "do": [2, 4, 5, 13, 19, 20, 21, 24, 26, 35, 36, 40, 43, 46, 53, 55], "adopt": [2, 4, 55], "store": [2, 4, 5, 6, 9, 10, 20, 22, 24, 30, 31, 32, 33, 36, 40, 41, 43, 44, 45, 46, 52, 53, 55], "tabl": [2, 4, 5, 6, 9, 10, 12, 13, 15, 17, 18, 20, 22, 24, 25, 26, 27, 29, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 51, 53, 55, 56], "get": [2, 4, 14, 36, 40, 41, 42, 46, 48, 55], "indic": [2, 4, 5, 9, 20, 21, 22, 24, 26, 30, 32, 33, 38, 55], "segment": [2, 24, 55], "multipl": [2, 4, 5, 8, 9, 10, 20, 22, 24, 25, 26, 35, 36, 38, 39, 41, 50, 55, 56], "span": 2, "node": [2, 4, 5, 14, 17, 24, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 43, 51, 53, 54, 55], "With": [2, 5, 25, 29, 34, 36, 55, 56], "portion": [2, 24], "": [2, 4, 5, 10, 13, 17, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 33, 34, 36, 37, 38, 40, 41, 42, 43, 44, 46, 47, 50, 51], "exist": [2, 5, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 41, 42, 45, 46, 50, 55, 56], "load": [2, 4, 5, 10, 17, 19, 20, 21, 23, 24, 25, 26, 27, 30, 31, 32, 33, 36, 38, 41, 45, 46, 47, 48, 49, 53, 55], "imbal": [2, 55], "oom": 2, "import": [2, 8, 9, 10, 13, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 55], "singl": [2, 4, 36, 40, 41, 42, 50, 54, 55, 56], "assum": [2, 4, 5, 9, 30, 38, 41, 55], "repres": [2, 9, 19, 22, 26, 40, 50], "id": [2, 4, 5, 9, 20, 21, 22, 23, 24, 25, 26, 29, 30, 33, 34, 35, 40, 41, 44], "ar": [2, 4, 5, 6, 9, 10, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 55, 56], "map": [2, 4, 5, 20, 21, 22, 23, 24, 26, 28, 31, 32, 33, 40, 41, 42, 51, 53, 55], "input_key_typ": [2, 4], "By": [2, 5, 13, 35, 36, 43, 50, 55], "32": [2, 4, 5, 6, 8, 21, 23, 25, 29, 30, 32, 33, 34, 40, 41, 42, 43, 46, 47, 51, 53, 55], "bit": [2, 5, 38, 41, 55], "i32": [2, 4], "64": [2, 4, 5, 6, 8, 21, 23, 34, 38, 41, 47], "i64": [2, 4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "allow": [2, 4, 5, 10, 13, 17, 25, 29, 30, 34, 36, 38, 41, 43, 46, 47, 48, 50, 55], "even": [2, 5, 36, 37, 55], "constrain": 2, "addit": [2, 4, 5, 30, 35, 36, 45, 50, 55], "overflow": [2, 31, 32, 33, 55], "verifi": [2, 4, 25, 29, 34, 43, 55], "beyond": [2, 5], "neg": [2, 55], "confid": 2, "disabl": [2, 5, 30, 31, 33, 35, 48, 55], "environ": [2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 38, 40, 41, 42, 43, 53, 54, 55], "variabl": [2, 4, 17, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 41, 53, 55], "hugectr_disable_overflow_check": [2, 55], "23": [2, 4, 6, 10, 17, 23, 24, 25, 30, 32, 33, 34, 40, 41, 42, 47, 48, 53], "sparse_embedding1": [2, 4, 5, 8, 20, 21, 24, 30, 31, 40, 41, 42, 51, 53], "input_data": [2, 42], "unlik": [2, 5, 54], "individu": [2, 4], "locat": [2, 5, 35, 36, 38, 41, 43, 53, 55, 56], "scalabl": [2, 10, 18, 36, 54, 55], "avail": [2, 4, 5, 8, 10, 13, 17, 18, 20, 21, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 36, 38, 39, 40, 41, 42, 43, 46, 49, 54, 55, 56], "togeth": [2, 4, 35, 39, 41, 43, 55], "format": [2, 3, 5, 6, 10, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 38, 40, 41, 42, 45, 50, 51, 54, 55], "other": [2, 4, 5, 8, 9, 10, 18, 20, 21, 22, 23, 24, 26, 30, 32, 33, 35, 36, 41, 43, 44, 50, 54, 55], "equip": [2, 5, 30], "dgx": [2, 40], "a100": [2, 6, 10, 13, 17, 19, 34, 35, 38, 43, 48], "1221": 2, "754": [2, 40], "8": [2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 38, 40, 41, 42, 47, 48, 49, 53], "4": [2, 4, 5, 6, 10, 20, 21, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 38, 40, 42, 45, 47, 49, 50, 51, 53, 54], "12": [2, 4, 6, 20, 21, 23, 24, 26, 28, 31, 32, 33, 40, 41, 42, 47, 51, 53], "49": [2, 20, 23, 32, 33, 40, 41, 42, 47, 51], "128": [2, 4, 5, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 47, 50, 51, 53], "loss": [2, 4, 20, 21, 22, 24, 26, 27, 31, 32, 33, 36, 40, 41, 42, 51, 53, 54, 55], "final": [2, 4, 43, 49, 55], "fuse": [2, 5, 23, 25, 28, 30, 33, 41, 55], "util": [2, 4, 5, 10, 13, 19, 20, 21, 22, 24, 25, 26, 30, 31, 32, 33, 36, 38, 40, 41, 43, 45, 55, 56], "layer_typ": [2, 4, 31, 40, 41, 42, 51, 53], "layer_t": [2, 4, 31, 40, 41, 42, 51, 53, 55], "cast": [2, 31, 32, 33], "innerproduct": [2, 4, 40, 41, 42, 51, 53], "prelu_dic": 2, "str": [2, 4, 5, 8, 9, 20, 21, 22, 23, 24, 26, 27, 28, 32, 33, 40, 42, 49, 51, 55], "top_nam": [2, 4, 31, 40, 41, 42, 51, 53], "output": [2, 4, 6, 9, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 40, 41, 42, 43, 46, 48, 51, 53, 55], "num_output": [2, 4, 31, 40, 41, 42, 51, 53], "weight_init_typ": 2, "weight": [2, 4, 6, 9, 10, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 36, 38, 41, 42, 51, 53, 55], "initializer_t": 2, "xaviernorm": 2, "xavieruniform": 2, "zero": [2, 4, 5, 20, 21, 22, 23, 24, 26, 28, 36, 41, 49, 51, 55], "bias_init_typ": 2, "bia": [2, 32, 47, 55], "shape": [2, 4, 6, 9, 14, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 47, 49, 51, 53, 55], "batch_siz": [2, 14, 21, 22, 26, 27, 30, 31, 32, 33, 41, 55], "ani": [2, 4, 5, 8, 10, 20, 21, 22, 23, 24, 26, 27, 28, 32, 35, 36, 40, 41, 42, 53, 55], "relu1": [2, 40, 41, 42, 51, 53], "fc2": [2, 22, 30, 40, 41, 42, 51, 53], "1024": [2, 4, 5, 6, 19, 21, 22, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 47, 48, 49, 51, 53, 54], "relu2": [2, 40, 42, 51, 53], "compris": [2, 4, 30, 31, 32, 33, 34, 48, 51], "fulli": [2, 5, 23, 31, 34, 36, 38, 40, 41, 42, 51, 53, 55, 56], "fp16": [2, 6, 24, 30, 36, 55], "fp32": [2, 4, 6, 24, 31, 32, 33, 55], "tf32": [2, 30, 33, 55], "act_typ": [2, 31], "activ": [2, 4, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 54, 55], "activation_t": [2, 31], "use_bia": [2, 31], "boolean": [2, 4, 5], "overrid": [2, 4, 26, 53], "bias": 2, "compute_config": 2, "denselayercomputeconfig": [2, 55], "configur": [2, 4, 6, 8, 9, 10, 12, 13, 15, 17, 18, 19, 23, 28, 35, 36, 38, 40, 41, 51, 53, 55], "valid": [2, 4, 5, 35, 42, 50, 51, 53, 55], "flag": [2, 5, 20, 21, 22, 23, 24, 26, 30, 33, 41, 55], "async_wgrad": [2, 55], "fuse_wb": [2, 55], "wgrad": [2, 55], "asynchron": [2, 4, 5, 19, 38, 55], "dgrad": 2, "fals": [2, 4, 5, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 42, 46, 47, 50, 51, 53, 55], "bgrad": 2, "compute_config_bottom": 2, "compute_config_top": 2, "mlp1": [2, 31], "512": [2, 4, 5, 24, 25, 29, 30, 31, 32, 33, 34, 40, 43, 47, 50, 51, 53], "256": [2, 4, 5, 6, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 47, 53, 55], "interaction1": [2, 31, 40, 53], "interaction_grad": 2, "mlp2": [2, 31], "cross": [2, 35, 38, 40, 41, 42, 53, 54, 55], "network": [2, 4, 5, 14, 17, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 43, 44, 47, 50, 51, 53, 54, 55], "explicit": [2, 19, 24, 30, 31, 32, 33], "two": [2, 4, 5, 10, 18, 19, 21, 24, 27, 30, 35, 36, 40, 50, 51, 53, 55], "invent": 2, "v1": [2, 20, 21, 22, 24, 30, 33, 35, 53, 54], "respect": [2, 4, 5, 10, 55], "n": [2, 5, 9, 24, 26, 30, 31, 32, 33, 40, 41, 42, 47, 50], "mathemat": 2, "formula": [2, 55], "those": [2, 4, 30, 55], "x_": 2, "l": [2, 26, 27, 46, 53], "x": [2, 4, 6, 8, 9, 26, 27, 32, 33, 34, 41, 42, 49, 53], "t": [2, 19, 24, 30, 35, 36, 42, 47, 50, 55], "_": [2, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 40, 42], "w_": 2, "b_l": 2, "x_l": 2, "w_l": 2, "mathbb": 2, "r": [2, 26, 27, 30, 47, 53], "times1": 2, "learnabl": 2, "x_0": 2, "odot": 2, "mathbf": 2, "w": [2, 19, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 41, 43, 55], "elementwis": 2, "dot": 2, "_l": 2, "decreas": [2, 5], "complex": [2, 5, 38, 50], "approxim": [2, 5], "factor": [2, 55], "lower": [2, 5, 35, 38], "matric": 2, "u": [2, 5, 6, 19, 25, 29, 30, 34, 35, 41, 43, 53, 55], "v": [2, 25, 29, 30, 34, 43, 47, 48, 55], "project": [2, 4, 10, 17, 18, 38, 39, 55], "correspondingli": [2, 4, 8, 24], "evolv": 2, "num_lay": [2, 30, 53], "posit": [2, 4, 55], "projection_dim": 2, "degrad": [2, 5, 55], "slice11": [2, 53], "multicross1": [2, 53], "6": [2, 4, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 36, 38, 40, 41, 42, 47, 50, 53], "thefmorder2": 2, "order": [2, 4, 5, 9, 20, 21, 22, 24, 26, 30, 31, 32, 33, 41, 50, 55], "fm": 2, "linear": [2, 32, 47, 54], "pairwis": 2, "product": [2, 5, 10, 19], "latent": 2, "out_dim": [2, 26, 27], "slice32": 2, "10": [2, 4, 5, 6, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 46, 47, 51, 53, 55], "multipli": [2, 9, 47, 55], "space": [2, 5, 30, 42], "weight_dim": 2, "matrix": [2, 4, 9, 36, 51], "slot_dim": 2, "vec_dim": 2, "correctli": [2, 4, 36, 41, 55], "emploi": [2, 4, 5, 28, 30, 31, 32, 33, 55], "result": [2, 4, 5, 9, 24, 28, 30, 31, 32, 33, 35, 36, 41, 50, 54, 55], "wise": [2, 55], "none": [2, 9, 20, 21, 22, 23, 24, 26, 27, 30, 33, 41, 42, 48, 51, 53, 55], "2x": [2, 24], "num_elem": 2, "slice1": 2, "slice2": 2, "eltmultiply1": 2, "implement": [2, 4, 5, 24, 33, 35, 36, 38, 41, 50, 55], "cudnn": [2, 30, 31, 32, 33, 47, 55], "batch": [2, 4, 5, 6, 8, 9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 38, 41, 47, 54, 55], "normal": [2, 40, 41, 42, 50], "float": [2, 4, 5, 9, 30, 32, 33, 47, 48], "exponenti": 2, "averag": [2, 4, 5, 30, 34, 35, 48, 55], "runningmean": 2, "newmean": 2, "ep": [2, 47], "epsilon": [2, 4, 31, 42], "1e": [2, 4, 28, 41, 47, 50], "5": [2, 4, 5, 6, 8, 9, 10, 13, 17, 20, 21, 22, 23, 24, 26, 28, 32, 33, 36, 38, 40, 42, 45, 46, 47, 49, 50, 51, 53], "gamma_init_typ": 2, "gamma": 2, "beta_init_typ": 2, "beta": [2, 4, 32], "00001": [2, 24], "varianc": 2, "file": [2, 3, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 35, 36, 38, 40, 41, 42, 43, 45, 46, 47, 50, 51, 54, 55], "my_snapshot_dense_5000": 2, "find": [2, 4, 5, 30, 35, 38, 50, 54, 55], "norm": [2, 4, 9, 38, 55], "shown": [2, 4, 5, 6, 8, 10, 17, 54], "192325": 2, "003050": 2, "323447": 2, "034817": 2, "091861": 2, "var": [2, 31, 32, 33], "738942": 2, "410794": 2, "370279": 2, "156337": 2, "638146": 2, "759954": 2, "251507": 2, "648882": 2, "176316": 2, "515163": 2, "434012": 2, "422724": 2, "001451": 2, "756962": 2, "126412": 2, "851878": 2, "837513": 2, "694674": 2, "791046": 2, "849544": 2, "694500": 2, "405566": 2, "211646": 2, "936811": 2, "659098": 2, "2d": [2, 55], "3d": [2, 55], "seq_len": 2, "4d": [2, 55], "num_attention_head": 2, "concaten": [2, 20, 21, 24, 26, 27, 28, 30, 32, 33, 38, 51, 55], "axi": [2, 6, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 42, 45, 48, 55], "dimension": [2, 38, 55], "num_feas_0": 2, "num_elems_0": 2, "num_fea": [2, 26, 27, 32, 33, 55], "num_elems_1": 2, "num_feas_1": 2, "reshape3": 2, "weight_multiply2": 2, "concat2": [2, 26, 27, 33, 53], "leading_dim": [2, 41, 42, 51, 53], "innermost": 2, "total": [2, 4, 5, 9, 10, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 41, 42, 46, 50, 51], "unspecifi": [2, 41], "n_slot": 2, "time_step": 2, "defin": [2, 5, 15, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 42, 45, 53], "selected_slot": 2, "ignor": [2, 4, 30, 32, 33, 41, 42, 53], "destin": [2, 55], "placehold": [2, 17, 24, 30, 31, 32, 33], "cannot": [2, 5, 9, 10, 31, 35, 38, 40, 41, 42, 47, 51, 53, 56], "deprec": [2, 4, 5, 41, 43, 55], "futur": [2, 4, 5, 20, 21, 22, 26, 28, 35, 41, 55], "restrict": [2, 4, 10, 35, 55], "tailing_dim": 2, "reshape1": [2, 26, 33, 41, 42, 51, 53], "416": [2, 32, 41, 42, 53], "dim": [2, 24, 30, 31, 32, 33, 47], "select1": 2, "selct": 2, "extract": [2, 10, 20, 21, 22, 24, 32, 33, 44, 49, 51, 52], "rang": [2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 46, 47, 49, 53, 55], "tupl": [2, 27], "creat": [2, 4, 5, 6, 10, 22, 28, 31, 32, 33, 35, 40, 41, 42, 43, 44, 45, 46, 47, 50, 52, 53, 55], "inclus": 2, "end": [2, 4, 5, 18, 19, 23, 24, 28, 30, 31, 36, 40, 41, 51, 53, 55], "exclus": [2, 19, 30, 55], "overlap": [2, 4, 5, 23, 28, 54, 55], "unless": [2, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 43, 53], "revers": 2, "along": [2, 4, 9, 55], "b": [2, 4, 24, 30, 41], "d": [2, 4, 30, 32, 40, 41, 42, 46, 47, 49, 51, 55], "c": [2, 10, 18, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 50, 55], "len": [2, 21, 22, 23, 26, 27, 28, 30, 32, 40, 41, 42, 46, 47, 49, 51], "actual": [2, 4, 5, 20, 21, 22, 24, 26, 36, 55], "explicitli": [2, 8, 24, 55], "slice21": 2, "slice22": 2, "weight_multiply1": 2, "3": [2, 4, 5, 6, 8, 9, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 37, 38, 40, 42, 45, 47, 49, 50, 51, 53, 54], "copi": [2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 40, 42, 46, 53, 55], "branch": [2, 35, 55], "topologi": [2, 4, 10, 55], "graph": [2, 4, 5, 6, 10, 14, 17, 22, 23, 27, 28, 36, 40, 41, 42, 50, 51, 53, 55], "parser": [2, 30, 31, 32, 33, 40, 42, 55], "intern": [2, 4, 8, 24, 26, 41, 55], "handl": [2, 4, 5, 17, 30, 31, 32, 33, 41, 50, 55], "situat": [2, 5, 41, 55], "behav": 2, "abov": [2, 4, 5, 10, 19, 24, 25, 29, 30, 34, 38, 43], "whilst": 2, "simplifi": [2, 50, 55], "randomli": 2, "zeroiz": 2, "drop": [2, 45, 55], "dropout_r": [2, 42, 53], "rate": [2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 37, 38, 39, 41, 45, 50, 51, 55], "between": [2, 4, 5, 18, 30, 34, 36, 40, 41, 50, 55], "dropout1": [2, 42, 53], "unit": [2, 4, 20, 21, 22, 23, 24, 26, 27, 33, 35, 54, 55], "elu_alpha": 2, "scalar": [2, 55], "satur": 2, "fc1": [2, 4, 22, 30, 40, 41, 42, 51, 53], "elu1": 2, "rectifi": 2, "sigmoid1": 2, "NOT": [2, 24, 53], "captur": 2, "typic": [2, 4, 5, 9], "output_dim": 2, "layer1": [2, 47], "layer3": [2, 47], "arbitrari": [2, 9, 36, 55], "manner": [2, 4, 5, 8, 10, 35, 43, 55], "nx": [2, 54], "fc4": [2, 40, 53], "reducesum1": 2, "reducesum2": 2, "remain": [2, 10, 13, 17, 38, 55], "gate": 2, "recurr": 2, "batchsiz": [2, 4, 20, 21, 22, 24, 26, 27, 31, 32, 33, 40, 41, 42, 47, 51, 53], "seqlength": 2, "sequenc": [2, 4, 20, 21, 26, 55], "vector_s": 2, "gru1": 2, "conncat1": 2, "20": [2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 32, 33, 40, 41, 47, 49, 51, 53, 54], "parametr": 2, "adapt": [2, 41], "adjust": [2, 5, 30, 55], "point": [2, 27], "prelu": 2, "dice": 2, "fc_din_i1": 2, "dice_1": 2, "specif": [2, 4, 5, 18, 20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 42, 44, 50, 53, 55], "item1": 2, "scale_item": 2, "sparse_embedding_good": 2, "sparse_embedding_c": 2, "fusedreshapeconcat_item_his_em": 2, "fusedreshapeconcat_item": 2, "accept": [2, 4, 14, 40, 41], "need": [2, 4, 5, 10, 13, 18, 19, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 38, 40, 41, 46, 50, 51, 53, 55], "mask": [2, 26, 27, 55], "10000": [2, 4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 42], "step": [2, 4, 5, 6, 8, 10, 20, 21, 22, 23, 24, 26, 27, 31, 32, 33, 34, 35, 36, 40, 41, 50, 53, 55], "softmax_i": 2, "y": [2, 6, 32, 50], "produc": [2, 4, 22, 26, 30, 55], "scale_item1": 2, "item_his1": 2, "sub_ih": 2, "reducemean1": 2, "mutipl": 2, "m": [2, 5, 6, 9, 19, 30, 33, 40, 41, 47, 49, 50, 55], "h": [2, 19, 30, 33, 41], "matrixmutiply1": 2, "text": [2, 4, 24, 43, 44, 49, 50, 51, 52], "cdot": 2, "q": [2, 20, 21, 22, 23, 24, 28, 32, 33, 35, 51], "inner": 2, "pad": [2, 4, 47], "due": [2, 15, 22, 33, 55], "inequ": 2, "attent": [2, 55], "head": [2, 35, 42, 45, 46, 47, 49, 50, 51, 55], "seq_from": 2, "hidden_dim": 2, "seq_to": 2, "queri": [2, 5, 10, 19, 38, 41, 55], "attention_out": 2, "mark": 2, "make": [2, 4, 5, 10, 19, 20, 21, 25, 26, 27, 30, 35, 36, 38, 40, 41, 42, 43, 44, 48, 50, 51, 53, 55], "sure": [2, 5, 19, 30, 35, 36, 41, 42, 50, 53, 55], "max_sequence_len_from": 2, "max_sequence_len_to": 2, "sequence_mask": 2, "eight": [2, 54], "num_indic": 2, "gather1": 2, "predict": [2, 3, 5, 31, 32, 33, 41, 50, 51, 55], "use_regular": 2, "regulari": 2, "THe": 2, "regularizer_typ": 2, "regular": [2, 5, 30, 55], "regularizer_t": 2, "l1": 2, "l2": [2, 9], "lambda": [2, 20, 21, 22, 24, 30, 33, 50], "term": [2, 4, 55], "use_regulari": 2, "propag": [2, 4, 5, 17, 41, 55], "phase": [2, 55], "backward": [2, 4, 32, 55], "v3": [2, 55], "7": [2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 26, 28, 30, 32, 33, 37, 38, 40, 41, 42, 47, 53, 54], "releas": [2, 4, 19, 24, 30, 33, 35, 41, 43, 50, 53, 54], "enabl": [2, 4, 5, 6, 10, 13, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 51, 53, 55], "placement": [2, 5, 55], "strategi": [2, 8, 19, 22, 25, 55], "compar": [2, 5, 6, 28, 41, 54, 55], "three": [2, 4, 5, 6, 18, 19, 30, 34, 35, 38, 54, 55], "advantag": [2, 5, 55, 56], "previou": [2, 5, 24, 51, 55], "enhanc": [2, 54, 55], "boost": [2, 36, 55], "flexibl": [2, 18, 55], "lookup": [2, 6, 9, 10, 12, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 36, 38, 55], "parallel": [2, 4, 5, 10, 38, 40, 46, 55, 56], "object": [2, 4, 5, 20, 21, 22, 24, 30, 33, 41, 42, 50, 55], "max_vocabulary_s": [2, 20, 22, 24, 26, 27, 32, 33, 40], "ev_siz": [2, 40], "config": [2, 8, 19, 23, 24, 26, 27, 30, 31, 32, 33, 35, 40, 41, 53, 55], "organ": [2, 4], "nccl_launch_mod": 2, "group": [2, 4, 5, 30, 35, 50, 55], "potenti": [2, 44, 55], "hang": [2, 55], "mix": [2, 4, 5, 24, 31, 40, 41, 42, 51, 53, 55, 56], "precis": [2, 4, 5, 24, 31, 40, 41, 42, 51, 53, 55], "attribut": [2, 15, 41], "dump": [2, 4, 23, 26, 27, 28, 31, 36, 41, 42, 46, 47, 48, 51, 53, 55], "contain": [2, 4, 5, 6, 8, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 36, 41, 43, 44, 45, 46, 47, 48, 50, 53, 54, 55], "incorrectli": [2, 55], "receiv": [2, 5, 10, 22, 26], "error": [2, 4, 5, 24, 30, 31, 33, 35, 41, 46, 47, 55], "know": [2, 5, 19, 55], "opt_param": [2, 4], "greater": [2, 4, 5, 19, 55], "sgd": [2, 4, 40, 53, 55], "adagrad": [2, 4, 55], "momentumsgd": [2, 4], "nesterov": [2, 4, 55], "rmsprop": 2, "adam": [2, 4, 20, 21, 22, 24, 27, 31, 32, 33, 41, 42, 51, 54, 55], "ftrl": [2, 4, 55], "203931": [2, 40], "18598": [2, 40], "14092": [2, 40], "7012": [2, 40], "18977": [2, 40], "6385": [2, 40], "1245": [2, 40], "186213": [2, 40], "71328": [2, 40], "67288": [2, 40], "11": [2, 6, 23, 24, 28, 30, 31, 32, 33, 40, 41, 42, 47, 48, 51, 53], "2168": [2, 40], "7338": [2, 40], "61": [2, 23, 40, 42, 47], "932": [2, 31, 40], "15": [2, 5, 8, 23, 30, 32, 33, 40, 41, 42, 47, 51, 53, 55], "204515": [2, 40], "141526": [2, 40], "199433": [2, 40], "60919": [2, 40], "9137": [2, 40], "71": [2, 23, 26, 40, 47], "34": [2, 23, 32, 33, 40, 41, 42, 47, 51, 53], "embedding_table_list": [2, 40], "append": [2, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 46, 47], "table_": 2, "use_exclusive_kei": [2, 40], "bool": [2, 5], "comm_strategi": [2, 55], "communicationstrategi": 2, "table_config": [2, 40], "major": [2, 4, 9, 38, 55], "arg": [2, 9, 20, 21, 22, 24, 26, 27, 30, 32, 33, 35, 40, 41, 42, 46], "abl": [2, 5, 19, 36, 55], "address": [2, 4, 5, 25, 29, 31, 34, 41, 43, 55], "challeng": [2, 10, 55], "we": [2, 4, 5, 6, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55], "etp": 2, "significantli": [2, 5, 30, 31, 32, 33, 55], "influenc": 2, "shard_matrix": [2, 40, 55], "num_gpu": [2, 23, 24, 28, 40, 42], "row": [2, 4, 9, 49, 50, 51], "place": [2, 24, 38, 40, 42, 55], "th": [2, 4], "shard_strategi": [2, 40], "mp": [2, 36, 40, 41, 56], "dp": [2, 40, 56], "t0": 2, "t1": 2, "t2": 2, "t3": 2, "And": [2, 4, 53, 55], "embedding_table_nam": [2, 5, 8, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "good": [2, 5, 41], "userid": [2, 45, 50, 51], "ebc_config": [2, 40], "num_tabl": [2, 23, 24, 28, 31, 32, 55], "sparse_embed": [2, 4], "interfac": [3, 35, 36, 38, 41, 55], "level": [3, 18, 50, 55], "createsolv": [3, 31, 40, 41, 42, 51, 53, 55], "asyncparam": [3, 55], "hybridembeddingparam": [3, 55], "datareaderparam": [3, 31, 40, 41, 42, 51, 53, 55], "createoptim": [3, 31, 40, 41, 42, 51, 53], "layer": [3, 5, 6, 7, 8, 10, 12, 13, 17, 18, 23, 25, 28, 30, 31, 32, 34, 36, 38, 40, 41, 42, 47, 48, 50, 53, 54, 55, 56], "compil": [3, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 30, 31, 33, 35, 38, 40, 41, 42, 51, 53, 55], "fit": [3, 10, 31, 36, 40, 41, 42, 50, 51, 53, 55, 56], "summari": [3, 20, 21, 22, 23, 24, 26, 27, 30, 31, 33, 40, 41, 42, 51, 53], "graph_to_json": [3, 31, 41, 42, 51, 53, 55], "construct_from_json": 3, "load_dense_weight": 3, "load_dense_optimizer_st": 3, "load_sparse_weight": [3, 51], "load_sparse_optimizer_st": 3, "freeze_dens": 3, "freeze_embed": [3, 51, 55], "unfreeze_dens": 3, "unfreeze_embed": [3, 55], "reset_learning_rate_schedul": 3, "set_sourc": 3, "low": [3, 5, 10, 13, 17, 18, 20, 21, 22, 24, 26, 27, 28, 32, 33, 36], "learningrateschedul": 3, "get_next": 3, "dataread": [3, 31, 40, 41, 42, 51, 53, 55], "is_eof": 3, "get_learning_rate_schedul": 3, "get_data_reader_train": 3, "get_data_reader_ev": 3, "start_data_read": 3, "set_learning_r": 3, "get_current_loss": 3, "eval": [3, 31, 40, 41, 42, 47, 51, 53, 55], "get_eval_metr": 3, "check_out_tensor": [3, 41, 55], "infer": [3, 6, 8, 10, 13, 17, 18, 19, 25, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 43, 51, 55, 56], "inferenceparam": [3, 5, 41, 55], "inferencemodel": [3, 5, 20, 21, 23, 24, 26, 55], "datageneratorparam": [3, 31, 38, 41, 55], "datagener": [3, 31, 38, 41, 55], "datasourceparam": [3, 53, 55], "input": [3, 4, 5, 6, 9, 14, 19, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 36, 38, 40, 41, 42, 44, 45, 47, 48, 50, 51, 53, 55], "embed": [3, 4, 6, 9, 10, 12, 13, 15, 17, 18, 20, 21, 23, 24, 25, 28, 29, 31, 32, 33, 34, 36, 37, 38, 42, 44, 49, 50, 52, 53, 55, 56], "distributedslotsparseembeddinghash": [3, 4, 31, 41, 42, 51, 53], "dens": [3, 4, 5, 6, 9, 10, 17, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 36, 38, 40, 41, 42, 51, 53, 55], "fullyconnect": [3, 55], "mlp": [3, 6, 26, 27, 31, 32, 33, 55], "multicross": [3, 53, 55], "fmorder2": [3, 55], "weightmultipli": 3, "elementwisemultipli": 3, "batchnorm": 3, "layernorm": 3, "concat": [3, 20, 21, 22, 23, 24, 30, 32, 33, 40, 41, 42, 51, 53, 55], "reshap": [3, 20, 21, 22, 23, 24, 26, 27, 32, 33, 41, 42, 51, 53, 55], "select": [3, 19, 55], "dropout": [3, 42, 53, 54, 55], "elu": [3, 55], "relu": [3, 22, 26, 27, 31, 32, 33, 40, 41, 42, 47, 51, 53, 54, 55], "sigmoid": [3, 22, 26, 27, 31, 32, 33, 41, 55], "interact": [3, 10, 13, 17, 19, 25, 26, 27, 29, 31, 32, 33, 34, 36, 38, 40, 43, 53, 54, 55], "reducesum": [3, 42, 55], "gru": [3, 55], "preludic": [3, 55], "scale": [3, 36, 37, 38, 50, 55], "fusedreshapeconcat": [3, 55], "fusedreshapeconcatgener": [3, 55], "softmax": [3, 22, 26, 55], "reducemean": [3, 55], "matrixmutipli": 3, "multiheadattent": [3, 55], "sequencemask": [3, 55], "gather": [3, 32, 33, 46, 55], "binarycrossentropyloss": [3, 31, 40, 41, 42, 51, 53], "crossentropyloss": [3, 55], "multicrossentropyloss": [3, 55], "overview": [3, 4, 5, 40], "us": [3, 4, 5, 6, 8, 9, 14, 15, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 34, 35, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56], "known": 3, "embeddingtableconfig": [3, 40], "embeddingcollectionconfig": [3, 40, 55], "embedding_lookup": [3, 6, 9, 20, 21, 23, 24, 30, 33, 40], "shard": [3, 22, 40, 55, 56], "As": [4, 5, 20, 21, 24, 26, 27, 36, 51, 55], "domain": [4, 44, 45], "framework": [4, 10, 13, 17, 18, 20, 24, 28, 34, 35, 36, 37, 38, 39, 41, 54, 55, 56], "focu": 4, "algorithm": [4, 5, 22, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "job": [4, 20, 21, 22, 23, 24, 26, 33, 41, 55], "automat": [4, 5, 10, 24, 50, 55], "deploi": [4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 25, 26, 37, 42, 43, 55], "hardwar": [4, 5, 30, 33, 55], "complet": [4, 24, 30, 31, 32, 33, 41, 46, 55], "without": [4, 5, 18, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 53, 55], "manual": [4, 20, 21, 23, 24, 26, 55], "been": [4, 20, 24, 31, 32, 33, 41, 54, 55], "wrap": [4, 22, 27, 36, 43, 56], "meanwhil": [4, 36], "maintain": [4, 5, 10, 35, 55], "who": [4, 55], "control": [4, 5, 19, 24, 30, 31, 32, 33, 55], "friendli": 4, "alreadi": [4, 5, 31, 40, 42, 43, 49, 50, 55], "deep": [4, 10, 18, 20, 21, 22, 23, 24, 26, 30, 35, 36, 37, 38, 50, 51, 54, 55, 56], "learn": [4, 10, 18, 37, 38, 50, 54, 55, 56], "like": [4, 5, 10, 19, 53, 55, 56], "kera": [4, 20, 21, 22, 23, 24, 26, 27, 30, 33, 55], "worthwhil": 4, "switch": [4, 41, 55], "notebook": [4, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55], "workflow": [4, 6, 36, 42, 50, 51, 55], "lot": [4, 30, 55], "core": [4, 6, 20, 21, 22, 23, 24, 26, 30, 33, 34, 41, 42, 54, 55], "structur": [4, 5, 10, 31, 40, 41, 42, 53, 55], "epoch": [4, 31, 40, 41, 42, 51, 53, 55], "simpli": [4, 30, 35, 41, 54, 55], "moreov": 4, "give": [4, 30, 50, 55], "save": [4, 10, 22, 23, 24, 27, 30, 31, 32, 33, 36, 41, 42, 45, 50, 53, 55], "statu": [4, 8, 24, 30, 31, 32, 33, 41, 42, 48], "etc": [4, 19, 37, 40, 55], "return": [4, 5, 8, 9, 12, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 47, 50, 55], "custom": [4, 10, 13, 17, 24, 30, 31, 32, 33, 35, 53, 55], "model_nam": [4, 5, 6, 9, 12, 15, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "empti": [4, 5, 9, 20, 21, 24, 26, 33, 41, 55], "seed": [4, 26, 31, 40, 41, 42, 51, 53], "lr_polici": 4, "polici": [4, 5], "suppot": 4, "fix": [4, 5, 35, 55], "lrpolicy_t": 4, "lr": [4, 31, 32, 40, 41, 42, 51, 53], "schedul": [4, 5, 42, 55], "001": [4, 31, 40, 41, 42, 53], "warmup_step": [4, 31, 36, 40, 41, 42, 51, 53], "warmup": [4, 19, 31, 40, 41, 42, 51, 53], "within": [4, 5, 10, 13, 23, 38, 43, 47, 48, 54, 55], "decay_start": [4, 31, 36, 40, 41, 42, 51, 53], "decai": [4, 36], "decay_step": [4, 31, 36, 40, 41, 42, 51, 53], "decay_pow": [4, 31, 40, 41, 42, 51, 53], "power": [4, 5, 19, 31, 38, 41, 55], "end_lr": [4, 31, 40, 41, 42, 51, 53], "max_eval_batch": [4, 31, 40, 41, 42, 51, 53, 55], "equal": [4, 5, 19, 21, 23, 27, 28, 41, 55], "bigger": [4, 50], "bathc": 4, "100": [4, 5, 19, 23, 27, 28, 30, 40, 47, 48, 51, 53], "batchsize_ev": [4, 31, 40, 41, 42, 51, 53, 55], "minibatch": 4, "2048": [4, 6, 30, 47, 49, 51], "here": [4, 19, 20, 21, 22, 23, 24, 25, 26, 29, 30, 34, 35, 36, 38, 40, 41, 43, 53, 54], "worker": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "vvgpu": [4, 31, 40, 41, 42, 51, 53], "physic": 4, "numa": [4, 31, 40, 41, 42, 51, 53, 55], "possibl": [4, 18, 36, 41, 55], "repeat_dataset": [4, 31, 40, 41, 42, 51, 53], "repeat": [4, 19, 47], "otherwis": [4, 5, 24, 42, 55], "use_mixed_precis": [4, 5, 31, 51, 53], "enable_tf32_comput": 4, "acceler": [4, 6, 17, 30, 33, 36, 37, 38, 39, 50, 55, 56], "fullyconnectedlay": [4, 36], "interactionlay": [4, 36, 55], "scaler": [4, 5, 31, 40, 41, 42, 51, 53], "metrics_spec": [4, 40], "metric": [4, 6, 19, 20, 21, 24, 26, 30, 34, 55], "auc": [4, 31, 41, 42, 51, 53, 55], "averageloss": [4, 40], "hitrat": [4, 55], "threshold": [4, 5, 20, 21, 22, 23, 24, 26, 31, 32, 33, 41, 55], "metricstyp": [4, 40], "8025": 4, "termin": [4, 35], "reach": [4, 19], "i64_input_kei": [4, 5, 23, 28, 30, 31, 33, 40, 41, 42, 51, 53], "choos": [4, 40, 53], "nvtabular": [4, 38, 43, 44, 45, 51, 52, 55], "use_algorithm_search": [4, 5], "search": [4, 5, 30, 31, 32, 33, 55], "cublasgemmex": [4, 5], "use_cuda_graph": [4, 5, 31, 41, 53, 55], "cuda": [4, 5, 24, 28, 30, 31, 32, 33, 40, 41, 42, 43, 47, 48, 51, 53, 55], "asyncdataread": 4, "hybridembed": 4, "task": [4, 5, 10, 19, 20, 21, 22, 23, 24, 25, 26, 28, 33, 35, 36, 41, 43, 44, 46, 55], "pack": [4, 5, 20, 21, 22, 23, 24, 28, 32, 33, 51, 55], "device_layout": 4, "longer": [4, 50, 55], "train_intra_iteration_overlap": [4, 55], "detect": [4, 30, 31, 32, 33], "toplogi": [4, 55], "tri": [4, 5], "train_inter_iteration_overlap": [4, 55], "fetch": [4, 46, 55], "next": [4, 30, 32, 46, 47, 50, 51, 55], "earlier": 4, "eval_intra_iteration_overlap": [4, 55], "knob": [4, 55], "similar": [4, 30, 31, 32, 33, 50, 55], "eval_inter_iteration_overlap": [4, 55], "all_reduce_algo": [4, 55], "allreducealgo": [4, 55], "oneshot": 4, "multi": [4, 5, 21, 34, 35, 38, 42, 43, 45, 46, 50, 53, 54, 55], "requir": [4, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 49, 50, 51, 53, 55], "run": [4, 5, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 41, 42, 47, 48, 53, 54, 55], "grouped_all_reduc": 4, "gradient": [4, 20, 21, 22, 24, 26, 27, 33, 55], "effect": [4, 24, 44, 46, 55], "small": [4, 5, 6, 38, 40, 41, 46, 55], "higher": [4, 5, 24, 46, 55], "hybrid": [4, 6, 27, 55], "num_iterations_statist": 4, "statist": [4, 5, 50], "300": [4, 22, 40, 47, 51, 53], "16384": [4, 6, 8, 30, 41, 54], "read": [4, 5, 30, 31, 32, 33, 38, 41, 46, 47, 50, 53, 54, 55], "done": [4, 26, 30, 31, 40, 41, 42, 50, 51, 53], "async_param": 4, "linux": [4, 24, 31, 41], "aio": 4, "peak": [4, 30, 31, 32, 33], "throughput": [4, 5, 19, 30, 36, 55], "num_thread": [4, 5, 55], "least": [4, 5, 9, 24, 28, 55], "num_batches_per_thread": 4, "work": [4, 8, 14, 18, 20, 21, 22, 26, 30, 35, 41, 50, 55], "simultan": [4, 36, 56], "max_num_requests_per_thread": 4, "io": [4, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 42, 43, 50, 53, 55], "request": [4, 5, 6, 19, 24, 30, 31, 32, 33, 35, 41, 50, 55], "72": [4, 23, 33, 34, 47], "most": [4, 5, 13, 19, 30, 33, 41, 55], "multi_hot_read": 4, "io_depth": 4, "queue": [4, 5, 6, 30, 55], "io_align": [4, 55], "byte": [4, 5, 10, 28, 30, 31, 32, 33, 41, 47, 50], "align": [4, 28, 55], "4096": [4, 6, 30, 31, 32, 33, 34, 41], "shuffl": [4, 32, 42, 50], "fed": [4, 30, 38], "aligned_typ": 4, "alignment_t": 4, "auto": [4, 24, 31, 32, 33, 41], "chosen": [4, 5], "obtain": [4, 10, 13, 20, 21, 22, 23, 24, 26, 27, 28, 30, 38, 40, 42, 50, 53], "unsign": 4, "is_dense_float": 4, "except": [4, 20, 21, 22, 23, 24, 26, 27, 28, 40, 41, 42, 46, 47, 53, 55], "thrown": 4, "param": [4, 20, 21, 22, 23, 24, 26, 30, 33], "16": [4, 5, 8, 9, 10, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 40, 41, 42, 47, 50, 51, 53, 54, 55], "overcom": [4, 55], "constraint": [4, 5, 30, 55], "impos": [4, 30, 55], "part": [4, 5, 19, 30, 37, 45, 55], "traffic": [4, 55], "over": [4, 5, 19, 35, 50, 54, 55], "improv": [4, 5, 22, 36, 44, 55], "deploy": [4, 5, 6, 10, 18, 20, 21, 24, 26, 30, 34, 35, 36, 55], "convers": [4, 30, 33, 41, 42, 55], "encod": [4, 51], "hybrid_embedding_param": 4, "max_num_frequent_categori": 4, "frequent": [4, 5, 50, 55], "categori": [4, 5, 30, 36, 50, 51, 55], "max_num_infrequent_sampl": 4, "infrequ": [4, 55], "p_dup_max": 4, "probabl": [4, 19, 38], "appear": [4, 19, 30, 38, 55], "onc": [4, 8, 33, 35, 41, 50, 55], "wai": [4, 10, 13, 17, 19, 25, 29, 30, 34, 38, 40, 43, 50, 54, 55], "determin": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "nvlink": [4, 34], "max_all_reduce_bandwidth": 4, "max_all_to_all_bandwidth": [4, 55], "efficiency_bandwidth_ratio": 4, "communication_typ": [4, 55], "being": [4, 19, 46, 55], "communicationtyp": [4, 55], "ib_nvlink": [4, 55], "ib_nvlink_hi": [4, 55], "nvlink_singlenod": 4, "protocol": [4, 42, 46, 47, 48, 55], "infiniband": [4, 5], "roce": [4, 55], "special": [4, 36], "gid": [4, 55], "hugectr_roce_gid": [4, 55], "hugectr_roce_tc": [4, 55], "hybrid_embedding_typ": 4, "hybridembeddingtyp": 4, "now": [4, 22, 30, 31, 32, 33, 42, 46, 49, 50, 55], "01": [4, 19, 24, 26, 27, 30, 31, 32, 33, 40, 41, 44, 47, 51, 53, 55], "3e11": 4, "9e11": 4, "warn": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "data_reader_typ": [4, 31, 40, 41, 42, 51, 53], "datareadertype_t": [4, 31, 40, 41, 42, 51, 53, 55], "file_list": [4, 31, 38, 41, 53], "txt": [4, 31, 38, 40, 41, 42, 51, 53, 55], "train_data": 4, "bin": [4, 19, 41, 49], "keyset": [4, 55], "show": [4, 5, 8, 18, 19, 20, 24, 25, 26, 33, 40, 41, 46, 54, 55], "eval_sourc": [4, 31, 40, 41, 42, 51, 53], "check_typ": [4, 31, 40, 41, 42, 51, 53], "mechan": [4, 5, 38, 41, 42, 55], "check_t": [4, 31, 40, 41, 42, 51, 53], "checksum": [4, 53], "cache_eval_data": 4, "num_sampl": [4, 20, 21, 22, 24, 26, 27, 32, 33, 55], "eval_num_sampl": 4, "float_label_dens": 4, "interpret": [4, 55], "log": [4, 25, 29, 30, 31, 32, 33, 34, 35, 38, 41, 42, 43, 54, 55], "f": [4, 19, 20, 21, 22, 23, 24, 28, 30, 32, 33, 35, 41, 42, 46, 47, 48, 49, 51], "num_work": [4, 32, 55], "concurr": [4, 5, 19, 30, 55], "empir": 4, "data_source_param": [4, 53, 55], "hdf": [4, 5, 35, 43, 55], "aw": [4, 5, 35, 43, 55], "s3": [4, 5, 35, 43, 55], "googl": [4, 55], "cloud": [4, 13, 17, 25, 29, 34, 43, 55], "async": [4, 41, 55], "fig": [4, 10, 17, 18, 31, 32, 33, 36, 38, 54], "minimum": [4, 6, 25, 29, 30, 34, 35, 43, 55], "granular": [4, 55], "header": [4, 24, 38, 41, 42, 55], "tabular": [4, 44, 50], "alwai": [4, 9, 55], "constant": [4, 30, 32, 33, 41], "payment": 4, "preced": [4, 18, 55], "yellow": 4, "box": [4, 50], "depict": 4, "reserv": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "signific": [4, 5, 22, 41], "exclud": 4, "charg": [4, 41], "definit": [4, 41], "typedef": 4, "struct": [4, 20, 21, 22, 23, 24, 26, 27, 28, 32, 33, 51, 55], "datasetheader_": 4, "error_check": 4, "check_num": 4, "number_of_record": 4, "datasethead": 4, "data_": 4, "check_sum": 4, "char": [4, 15, 41], "checkbit": 4, "slot_": 4, "changeabl": 4, "45": [4, 23, 30, 32, 33, 40, 41, 42, 47, 51, 53, 54], "67": [4, 23, 47], "undefin": [4, 31, 55], "behavior": [4, 5, 30, 41, 55], "given": [4, 9, 45], "assign": [4, 5, 24, 30, 31, 32, 33, 35, 41, 51, 55], "line": [4, 30, 33, 40, 41, 42, 43, 55], "path": [4, 5, 19, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 40, 42, 45, 46, 47, 50, 51, 53, 55], "cat": [4, 28, 42, 50, 53], "simple_sparse_embedding_file_list": 4, "simple_sparse_embed": 4, "simple_sparse_embedding0": 4, "simple_sparse_embedding1": 4, "simple_sparse_embedding2": 4, "simple_sparse_embedding3": 4, "simple_sparse_embedding4": 4, "simple_sparse_embedding5": 4, "simple_sparse_embedding6": 4, "simple_sparse_embedding7": 4, "simple_sparse_embedding8": 4, "simple_sparse_embedding9": 4, "wdl_norm": 4, "file_list_test": [4, 31, 38, 41, 53], "aspect": 4, "datatyp": [4, 24, 31, 32, 33, 41], "outperform": 4, "disk": [4, 30, 45, 50, 55], "feed": [4, 33, 38, 41, 50], "go": [4, 35, 40, 41, 42, 43, 50], "incorpor": [4, 13], "3g": [4, 55], "wdl_raw": 4, "validation_data": 4, "column": [4, 41, 42, 45, 49, 50, 51, 55], "orient": 4, "open": [4, 5, 10, 13, 17, 20, 21, 22, 23, 24, 28, 30, 31, 32, 33, 36, 38, 39, 41, 46, 47, 48, 49, 51, 55], "free": [4, 41, 42, 55], "apach": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "hadoop": [4, 35, 36, 43, 53, 55], "ecosystem": 4, "compress": [4, 38], "nest": [4, 55], "loader": [4, 23, 24, 28, 30, 31, 32, 33, 41], "miss": [4, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 47, 51, 55], "int64": [4, 5, 9, 10, 12, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 41, 42, 49, 50, 55], "arrang": 4, "numer": [4, 5, 38, 44], "separ": [4, 5, 10, 20, 21, 24, 26, 27, 31, 41, 50, 55], "_metadata": [4, 50, 53, 55], "file_stat": [4, 53], "file_nam": [4, 53], "file0": 4, "num_row": [4, 53], "409600": 4, "file1": 4, "col_nam": [4, 53], "c1": [4, 53], "c2": [4, 53], "c3": [4, 53], "c4": [4, 53], "cont": [4, 42, 53], "i1": 4, "i2": 4, "i3": 4, "parquet_data": 4, "_file_list": [4, 40, 42, 51], "val": [4, 31, 40, 41, 42, 53], "50000": [4, 24], "20000": [4, 20, 21, 24, 42], "whose": [4, 24, 25, 26, 40, 55], "duplic": [4, 36, 50, 55], "ensur": [4, 5, 8, 13, 19, 23, 28, 30, 41, 50, 55], "snippet": 4, "0th": 4, "1st": [4, 21, 40], "third": [4, 18, 19, 35, 43, 55], "60000": 4, "entri": [4, 21, 22, 26, 33, 55], "resid": 4, "folder": [4, 19, 24, 26, 30, 31, 40, 41, 55], "basic": [4, 9, 10, 12, 41], "four": [4, 55], "frame": 4, "edit": [4, 35], "desir": [4, 10, 30, 41, 55], "chang": [4, 5, 19, 20, 21, 26, 30, 36, 50, 55, 56], "hyperparamet": [4, 36, 41], "well": [4, 50, 55], "meticul": 4, "update_typ": [4, 31, 40, 42, 53], "hit": [4, 5, 19, 20, 21, 22, 23, 24, 26, 31, 32, 33, 41, 50, 51, 55], "lazyglob": 4, "semant": [4, 55], "optimizer_typ": [4, 31, 40, 41, 42, 51, 53], "optimizer_t": [4, 31, 40, 41, 42, 51, 53], "update_t": [4, 31, 40, 42, 53], "beta1": [4, 31, 42], "9": [4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 38, 41, 42, 47, 48, 53], "beta2": [4, 31, 42], "999": [4, 31, 42], "lambda1": 4, "lambda2": 4, "momentum_factor": 4, "atomic_upd": [4, 40, 53], "atom": [4, 41], "0000001": [4, 42], "groupdens": 4, "hugectr_layer_book": 4, "trane": 4, "reader_param": 4, "groupdenselay": [4, 55], "embeddingcollect": 4, "seri": [4, 37, 43, 44], "taken": [4, 9], "dense_lay": 4, "overload": [4, 50, 55], "flexibli": 4, "buffer": [4, 5, 26, 41, 55], "loss_nam": 4, "loss_weight": 4, "match": [4, 5, 8, 24, 30, 38], "through": [4, 5, 10, 13, 36, 37, 38, 39, 41, 45, 47, 49, 50, 55], "num_epoch": [4, 55], "max_it": [4, 31, 40, 41, 42, 51, 53, 55], "2000": [4, 19, 21, 42, 51, 53], "displai": [4, 31, 40, 41, 42, 43, 51, 53, 55], "200": [4, 24, 26, 27, 30, 31, 40, 41, 51, 53], "eval_interv": [4, 31, 40, 41, 42, 51, 53], "execut": [4, 6, 8, 10, 24, 30, 33, 35, 41, 47, 48, 51, 55], "1000": [4, 10, 19, 21, 27, 28, 31, 40, 41, 42, 47, 51, 53, 55], "invalid": 4, "remot": [4, 5, 43, 55], "gc": [4, 5, 53, 55], "localhost": [4, 5, 6, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 41, 55], "9000": [4, 5, 42, 53, 55], "dir": [4, 5, 19, 30, 31, 32, 33, 50], "virtual": [4, 5, 41], "style": [4, 5, 55], "region": [4, 5, 53], "offici": [4, 5, 55], "uri": [4, 5, 55], "bucket": [4, 5], "url": [4, 5, 18, 24, 35, 46, 55], "http": [4, 5, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 45, 47, 48, 49, 50, 53, 55], "googleapi": [4, 5, 40, 42, 53], "com": [4, 5, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 47, 49, 50, 53, 55], "mpi": [4, 31, 40, 41, 42, 43, 51, 53, 55], "print": [4, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 46, 47, 50, 51, 55], "graph_config_fil": [4, 42, 51, 53], "fine": [4, 55], "tune": 4, "include_dense_network": 4, "whole": [4, 10, 30, 36, 56], "dense_opt_states_fil": [4, 55], "\u2170": 4, "sparse_embedding_fil": 4, "\u2171": 4, "sparse_embedding_files_map": 4, "dict": [4, 8, 20, 21, 22, 24, 26, 27, 32, 33, 41, 46], "sparse_embedding2": [4, 5, 41, 42], "358": [4, 24], "wdl_0_sparse_4000": 4, "wdl_1_sparse_4000": 4, "sparse_opt_states_fil": [4, 55], "sparse_opt_states_files_map": 4, "freez": [4, 32], "criteo": [4, 30, 38, 40, 42, 54, 55], "embedding_nam": 4, "unfreez": 4, "reset": [4, 41, 55], "base_lr": 4, "under": [4, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 50, 53, 55], "On": [4, 8, 40, 55], "basi": [4, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "expos": 4, "elabor": 4, "datareader32": 4, "datareader64": 4, "re": [4, 30, 35, 38, 41, 46, 55], "form": [4, 25, 38, 41, 55], "begin": [4, 5, 28, 30, 33], "train_data_read": 4, "eval_data_read": 4, "enter": [4, 41], "loop": [4, 22, 33, 41, 50], "later": [4, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 50, 55], "emb_vector": [4, 9, 10, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 51, 53], "distributedslotembed": [4, 36], "slot_id": 4, "localizedslotembed": [4, 36], "info": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "nth": 4, "suffix": [4, 41], "latest": [4, 55], "via": [4, 5, 6, 10, 28, 30, 41, 49, 55], "numpi": [4, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 47, 48, 49, 50, 51, 55], "float32": [4, 9, 10, 12, 14, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 49, 50, 55], "float16": 4, "flow": 4, "debug": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 40, 41, 42, 53, 55], "correct": [4, 30, 41, 55], "intermedi": [4, 5, 35, 55], "easili": [4, 10, 20, 28, 38, 50, 55], "tensor_nam": 4, "tensor_typ": 4, "tensor_t": [4, 41], "1280": [4, 24, 53], "75": [4, 6, 10, 13, 17, 23, 32, 33, 38, 42, 47], "concat1": [4, 26, 27, 30, 33, 41, 42, 51, 53], "sparse_embedding1_train_flow": 4, "fc1_evaluate_flow": 4, "inferencesess": [4, 41], "server": [4, 6, 19, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 35, 37, 43, 48, 53, 54, 55], "tensorflow": [4, 5, 6, 8, 17, 18, 20, 21, 22, 23, 25, 26, 27, 34, 35, 36, 37, 38, 41, 43, 55, 56], "tensorrt": [4, 5, 6, 15, 18, 24, 43, 55], "purpos": [4, 38, 43, 50, 55], "triton": [4, 5, 6, 17, 18, 25, 34, 35, 38, 55], "deriv": [4, 10], "besid": [4, 20, 22, 24, 55], "session": [4, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "model_config_path": 4, "inference_param": 4, "max_batchs": [4, 5, 41], "num_batch": [4, 55], "40000": [4, 24], "40960": [4, 31, 41, 53], "960": 4, "cardin": [4, 51], "suitabl": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 45, 53, 55], "model_config": 4, "dcn_dense_1000": 4, "dcn0_sparse_1000": 4, "deployed_devic": [4, 5, 41], "use_gpu_embedding_cach": [4, 5, 41, 55], "cache_size_percentag": [4, 5, 41], "inference_model": [4, 20, 21, 26], "pred": [4, 23, 28, 32, 41], "embed_vec_s": [4, 9, 20, 22, 24, 26, 27, 30, 32, 33], "sparse_embedding1_inference_flow": 4, "acknowledg": 4, "synthet": [4, 30, 31, 41, 45, 46, 55], "num_slot": [4, 31, 41, 55], "paruqet": 4, "test_data": 4, "nnz_arrai": [4, 31, 41], "simul": [4, 55], "dist_typ": [4, 31, 41], "distribution_t": [4, 31, 41], "powerlaw": [4, 19, 31, 41], "power_law_typ": [4, 31, 41], "law": [4, 20, 21, 22, 23, 24, 26, 27, 28, 31, 38, 40, 41, 42, 53, 55], "powerlaw_t": [4, 31, 41], "alpha": [4, 19, 31, 32, 38, 41, 55], "medium": [4, 37, 55], "short": [4, 31, 37, 41, 55], "num_fil": [4, 31, 41], "eval_num_fil": [4, 31, 41], "num_samples_per_fil": [4, 31, 41], "5242880": [4, 53], "1310720": 4, "regard": [4, 5, 6, 55], "data_generator_param": [4, 31, 41], "encapsul": [4, 13, 55], "datasourc": 4, "hugect": 4, "filesystemtype_t": [4, 53], "ip": [4, 5, 25, 29, 30, 34, 43, 47, 48, 53], "cluster": [4, 5, 10, 24, 33, 36, 38, 42, 53, 55, 56], "namenod": [4, 53, 55], "endpoint": [4, 5, 53], "put": [4, 49], "Will": 4, "listen": [4, 5], "huge": 5, "further": [5, 55], "grant": 5, "abil": [5, 18, 55], "perman": 5, "demo": [5, 19, 36, 55], "offer": [5, 18, 55, 56], "superior": 5, "cpu": [5, 6, 8, 10, 18, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 41, 43, 47, 48, 50, 54, 55], "counterpart": [5, 6, 55], "although": [5, 55], "modern": 5, "center": 5, "nvidia": [5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 49, 50, 53, 54, 55], "increas": [5, 30, 54, 55], "ai": [5, 36], "come": [5, 55], "spearhead": 5, "vastli": [5, 55], "clsuter": 5, "ram": [5, 10], "asid": 5, "retain": [5, 55], "hdd": [5, 10], "sdd": [5, 10], "magnitud": [5, 30], "ddr": 5, "hbm": [5, 27, 55], "cost": 5, "throughout": [5, 55], "latenc": [5, 6, 10, 13, 17, 18, 19, 20, 24, 28, 30, 34, 36, 41, 55], "drr": 5, "act": 5, "therebi": 5, "respons": [5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 53], "redi": [5, 55], "retriev": [5, 9, 10, 13, 17, 20, 24, 26, 28, 36, 55], "rdb": [5, 41], "aof": [5, 41], "seamless": 5, "restart": [5, 41, 46, 47, 48], "particip": 5, "claim": 5, "guarante": [5, 33, 41, 55], "statement": [5, 13, 17, 43], "hiredi": [5, 41], "love": 5, "hear": 5, "experi": [5, 10, 19, 25, 29, 34, 43, 55], "let": [5, 41, 50, 55], "successfulli": [5, 10, 24, 25, 29, 30, 31, 32, 33, 34, 36, 41, 42, 43, 53], "unsuccessfulli": 5, "target": [5, 19, 35, 36, 41, 43, 46, 50, 51, 54, 55], "link": [5, 10, 24, 30, 38, 40, 42, 46, 49, 55], "consid": [5, 20, 21, 26, 36, 49], "compliment": 5, "expand": 5, "capabl": [5, 20, 21, 22, 23, 24, 26, 31, 33, 35, 41, 55, 56], "capac": [5, 18, 36], "entir": [5, 55], "whatev": 5, "reason": [5, 24, 43], "becom": [5, 38, 55], "unavail": [5, 55], "respond": [5, 35], "though": 5, "properti": [5, 50], "emphas": 5, "rough": 5, "guidelin": 5, "often": [5, 44], "ethernet": 5, "rel": 5, "practic": [5, 36], "gb": [5, 25, 29, 34, 40, 41, 42, 43], "few": 5, "tb": [5, 55], "mainten": 5, "stream": [5, 23, 28, 30, 33, 41, 46, 55], "extern": [5, 45, 50], "kafka": [5, 55], "downtim": 5, "retrain": [5, 30], "logic": [5, 9], "whenev": 5, "engin": [5, 6, 17, 18, 24, 34, 42, 50, 52, 55], "associ": [5, 55], "resolv": [5, 31, 40, 41, 42, 51, 53, 55], "turn": [5, 6, 23, 50, 55], "represent": 5, "fill": [5, 40, 41], "publish": [5, 41], "certain": 5, "ingest": [5, 55], "stage": [5, 19, 20, 21, 24, 26, 30, 31, 32, 33, 38, 54, 55], "suffici": [5, 55], "attempt": [5, 30, 31, 32, 33, 55], "minim": [5, 35, 55, 56], "recent": [5, 55], "lru": 5, "volatiledatabaseparam": [5, 41], "persistentdatabaseparam": 5, "updatesourceparam": 5, "These": [5, 10, 13, 17, 26, 33, 38, 44, 55], "packag": [5, 10, 17, 22, 24, 26, 30, 32, 33, 36, 38, 46, 47, 48, 49, 50, 55, 56], "supportlonglong": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "fuse_embedding_t": [5, 23, 28, 30, 33, 55], "volatile_db": [5, 41], "persistent_db": 5, "update_sourc": 5, "At": [5, 40], "origin": [5, 26, 38, 54, 55], "synchron": [5, 19, 30, 35, 55], "plugin": [5, 6, 18, 22, 23, 25, 26, 28, 29, 35, 37, 38, 43, 55], "torch": [5, 17, 18, 29, 32, 41, 47, 48, 55], "describ": [5, 36], "speak": 5, "rare": [5, 40, 55], "might": [5, 30, 32], "sens": 5, "vari": 5, "heterogen": 5, "network_fil": [5, 19], "number_of_refresh_buffers_in_pool": 5, "thread_pool_s": [5, 28, 33], "cache_refresh_percentage_per_iter": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 55], "default_value_for_each_t": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "maxnum_des_feature_per_sampl": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "embedding_cache_typ": [5, 23, 28, 30, 55], "refresh_delai": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "refresh_interv": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "maxnum_catfeature_query_per_table_per_sampl": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "embedding_vecsize_per_t": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "divis": 5, "device_id": [5, 26, 41], "devicelist": 5, "goe": 5, "directli": [5, 20, 21, 24, 26, 27, 33, 38, 41, 47, 55], "uvm": [5, 55], "No": [5, 20, 21, 23, 24, 26, 30, 31, 32, 33, 40], "percentag": [5, 6, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "pool": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "refresh": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "increment": [5, 50, 55], "occur": [5, 31, 55], "frequenc": [5, 30, 55], "volum": 5, "std": [5, 41, 47, 55], "hardware_concurr": [5, 55], "delai": [5, 19], "wait": [5, 28, 30, 35, 41, 45], "timer": [5, 41], "servic": [5, 10, 20, 21, 22, 26, 30, 33, 55], "period": [5, 36], "partit": [5, 50, 55], "use_context_stream": [5, 23, 28, 30, 33], "context": [5, 23, 28, 30, 33, 41], "sparse_fil": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "wdl_infer": [5, 19], "wdl0_sparse_20000": 5, "wdl1_sparse_20000": 5, "dense_fil": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "wdl_dense_20000": 5, "num_of_worker_buffer_in_pool": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "num_of_refresher_buffer_in_pool": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "deployed_device_list": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "max_batch_s": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "table1": [5, 23, 28], "table2": [5, 23, 28], "gpucachep": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "gpucach": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "back": [5, 24, 41, 55], "indvidu": 5, "collabor": 5, "inject": 5, "underli": [5, 10, 13, 17, 38, 55], "redis_clust": [5, 41], "127": [5, 26, 30, 41, 42], "7000": [5, 41, 42], "user_nam": 5, "password": 5, "num_partit": [5, 41], "allocation_r": 5, "268435456": 5, "mib": [5, 30, 31, 32, 33], "shared_memory_s": 5, "17179869184": [5, 41], "gib": [5, 42], "shared_memory_nam": 5, "hctr_mp_hash_map_databas": [5, 41], "shared_memory_auto_remov": [5, 41], "65536": [5, 6, 20, 30, 40], "enable_tl": [5, 41, 55], "tls_ca_certif": [5, 41, 55], "cacertbundl": 5, "crt": [5, 41], "tls_client_certif": [5, 41, 55], "client_cert": 5, "pem": [5, 41], "tls_client_kei": [5, 41, 55], "client_kei": 5, "tls_server_name_identif": [5, 41, 55], "overflow_margin": 5, "overflow_polici": 5, "databaseoverflowpolicy_t": 5, "enum_valu": 5, "overflow_resolution_target": 5, "initialize_after_startup": [5, 41], "initial_cache_r": 5, "cache_missed_embed": 5, "update_filt": 5, "filter": [5, 30], "7003": 5, "7004": 5, "7005": 5, "10000000": [5, 40, 42], "evict_random": 5, "hash_map": 5, "multi_process_hash_map": [5, 41, 55], "live": [5, 24], "dev": [5, 41, 42, 55], "shm": [5, 41, 55], "parallel_hash_map": 5, "degre": 5, "hashmap": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "split": [5, 30, 42, 47, 55], "evenli": 5, "min": [5, 19, 21, 31, 32, 33], "number_of_cpu_cor": 5, "build": [5, 6, 17, 18, 24, 25, 29, 34, 36, 41, 47, 50, 53, 55, 56], "denot": 5, "word": [5, 9, 41], "upper": 5, "bound": 5, "latter": 5, "particularli": [5, 38], "imag": [5, 25, 29, 34, 35, 38, 43, 44, 46, 47, 49, 51, 52], "insuffici": 5, "nativ": [5, 6, 10, 18, 19, 23, 25, 30, 31, 32, 36, 41, 55], "doc": [5, 24, 30, 31, 32, 33, 41, 55], "symbol": [5, 31, 42], "attach": [5, 41], "remov": [5, 35, 40, 41, 50, 55], "disconnect": [5, 41], "program": [5, 30, 31, 32, 33, 41, 43, 55], "pattern": [5, 55], "account": [5, 50], "divid": [5, 9], "num_paritit": 5, "strictli": 5, "incur": [5, 55], "overhead": [5, 6, 22, 30, 55], "too": [5, 41, 50, 55], "5x": [5, 24, 55], "mass": 5, "chunk": [5, 35, 50, 55], "transmiss": 5, "stabil": [5, 30], "1000000": [5, 53], "conjunct": [5, 55], "262143": 5, "18": [5, 19, 23, 30, 32, 33, 41, 47, 51, 53], "lead": [5, 35, 36, 37, 55], "obscur": 5, "therefor": [5, 30, 35, 41, 55], "tl": [5, 55], "ssl": [5, 55], "secur": [5, 50], "encrypt": [5, 41, 55], "slightli": [5, 55], "filesystem": [5, 30, 55], "certif": [5, 41], "ca": [5, 41], "client": [5, 19, 24, 30, 31, 32, 33, 41, 42, 55], "privat": [5, 41], "sni": 5, "instabl": 5, "sporad": 5, "consumpt": [5, 55], "occupi": [5, 24, 30, 33, 42], "ideal": 5, "100000000": [5, 50], "reliabl": [5, 50], "condit": [5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "prune": 5, "conduct": [5, 6, 28, 29, 55], "until": [5, 19, 20, 21, 24, 26, 41, 55], "evict_least_us": 5, "lfu": 5, "effort": [5, 55], "evict_oldest": 5, "complic": [5, 41, 50, 56], "comparison": [5, 54, 55], "faster": [5, 54, 55], "deliv": [5, 55], "evict": [5, 41, 55], "doubl": [5, 9, 41], "fraction": 5, "keep": 5, "exactli": [5, 9, 55], "shrunk": 5, "80": [5, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 31, 32, 33, 35, 38, 41, 42, 43, 47], "surpass": 5, "content": [5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 41, 42, 53, 55], "previous": [5, 55], "reconnect": 5, "rocksdb": [5, 55], "materi": [5, 50], "immedi": 5, "upon": [5, 55], "startup": [5, 30, 55], "50": [5, 20, 22, 23, 24, 30, 32, 33, 41, 42], "anoth": [5, 41, 42, 55], "written": [5, 20, 21, 24, 26, 30, 33, 43], "send": [5, 6, 24, 30, 31, 32, 33, 41, 55], "hps_": 5, "databasetype_t": [5, 41], "tmp": [5, 32, 42], "read_onli": 5, "rocks_db": 5, "datatabas": 5, "prevent": [5, 38, 41, 55], "found": [5, 9, 20, 21, 23, 24, 26, 30, 32, 33, 36, 40, 41, 43, 51, 53], "Be": 5, "awar": [5, 31], "overwrit": [5, 22, 23, 24, 26, 30, 33, 40, 51, 53], "driver": [5, 40], "nf": 5, "kept": [5, 6], "sync": 5, "kafka_message_queu": 5, "broker": [5, 55], "metadata_refresh_interval_m": 5, "30000": [5, 20, 21, 24], "poll_timeout_m": 5, "500": [5, 40, 51, 53], "receive_buffer_s": 5, "262144": 5, "8192": [5, 6, 30, 40], "failure_backoff_m": 5, "max_commit_interv": 5, "9092": 5, "null": [5, 15, 41, 55], "semicolon": 5, "delimit": 5, "pair": [5, 38, 42, 51], "topic": [5, 10, 36], "metadata": [5, 35, 45, 46, 50, 55], "download": [5, 19, 30, 35, 40, 42, 44, 46, 49, 52, 55], "send_buffer_s": 5, "kafkamessagesink": 5, "push": 5, "millisecond": [5, 55], "dispatch": [5, 22, 26], "fail": [5, 24, 42], "success": [5, 6, 8, 30, 31, 35, 41, 42, 51, 53], "temporarili": 5, "unreach": 5, "retri": 5, "commit": 5, "independ": [5, 13, 24, 30, 31, 32, 33, 55], "were": [5, 20, 21, 22, 24, 30, 33, 50, 54, 55], "sinc": [5, 23, 24, 30, 31, 32, 33, 36, 38, 40, 41, 55], "create_tf_model": 6, "py": [6, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 50, 51, 53, 55], "savedmodel": [6, 8, 21, 25, 26, 30, 33, 55], "16gb": [6, 51, 54], "almost": [6, 20, 21, 24, 26, 54], "furthermor": 6, "create_trt_engin": 6, "summar": [6, 10, 25, 29, 30, 34, 43, 52], "onnx": [6, 17, 43, 55], "surgeri": [6, 17], "experiment": [6, 23, 27, 41, 55], "variablepolici": 6, "save_variable_devic": 6, "common": [6, 24, 26, 27, 36, 53, 54, 56], "baselin": 6, "nn": [6, 9, 10, 12, 20, 21, 22, 24, 28, 30, 32, 33, 47], "lookuplay": [6, 7, 8, 11, 22, 23, 26, 28], "unchang": 6, "integr": [6, 10, 17, 18, 20, 34, 37, 55], "built": [6, 18, 20, 21, 24, 26, 30, 34, 35, 36, 47, 55], "optimum": 6, "131072": 6, "investig": [6, 41], "sxm4": [6, 34], "80gb": [6, 34, 36], "trt": [6, 15, 25, 30, 31, 32, 33, 43, 55], "hps_tensorflow_triton_deployment_demo": [6, 25], "demo_for_tf_trained_model": [6, 34], "repeatedli": [6, 22, 33, 41], "analyz": [6, 30, 55], "serv": [6, 18, 30, 33, 36, 55], "studi": [6, 55], "measur": [6, 30, 50, 55], "perf_analyz": [6, 19, 30], "8000": [6, 24, 30, 31, 32, 33, 42], "categorical_featur": [6, 30, 31, 32, 33], "numerical_featur": [6, 30, 31, 32, 33], "276633": 6, "7912898": 6, "7946796": 6, "7963854": 6, "7971191": 6, "7991237": 6, "7991368": 6, "7998351": 6, "7999728": 6, "8014930": 6, "13554004": 6, "14136456": 6, "14382203": 6, "14382219": 6, "14384425": 6, "14395091": 6, "14395194": 6, "14395215": 6, "14396165": 6, "14671338": 6, "22562171": 6, "25307802": 6, "32394527": 6, "32697105": 6, "32709007": 6, "32709104": 6, "76171875": 6, "806640625": 6, "609375": 6, "04296875": 6, "7919921875": 6, "0986328125": 6, "9453125": [6, 33], "38671875": 6, "3984375": 6, "9462890625": 6, "side": [6, 19, 24, 30, 55], "report": [6, 24, 30, 55], "count": [6, 24, 26, 27, 30, 31, 32, 33, 46], "28589": 6, "avg": [6, 30], "562": [6, 41, 47], "usec": [6, 30, 34], "59": [6, 20, 23, 33, 40, 47, 51, 53, 55], "431": [6, 41], "53": [6, 19, 23, 26, 40, 47, 51, 53], "merlin": [6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 41, 42, 43, 50, 53, 55], "nvcr": [6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 43, 55], "02": [6, 10, 17, 25, 30, 33, 34, 41, 44, 45, 47, 51, 53], "amd": [6, 34], "epyc": [6, 34], "7742": [6, 34], "processor": [6, 34], "softwar": [6, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 46, 53, 55], "22": [6, 23, 24, 30, 32, 33, 47, 51, 53, 55], "cuda11": 6, "microsecond": 6, "figur": [6, 18], "logarithm": 6, "10x": 6, "speedup": [6, 54, 55], "551": [6, 28, 30, 40], "612": 6, "380": [6, 28, 30, 40, 42], "389": 6, "42": [6, 22, 23, 30, 31, 32, 33, 40, 41, 42, 45, 47, 50, 51], "608": [6, 40, 47, 53], "667": [6, 41, 53], "381": [6, 40], "346": [6, 47], "76": [6, 23, 30, 53], "832": 6, "639": 6, "438": [6, 47], "428": [6, 47], "94": [6, 23, 47], "1911": 6, "849": 6, "604": [6, 47], "534": [6, 40], "58": [6, 23, 30, 33, 42, 47, 51, 53], "4580": 6, "1059": 6, "927": [6, 30, 40], "766": 6, "98": [6, 23, 47, 50], "9872": 6, "1459": 6, "1446": 6, "1114": 6, "86": [6, 23, 24, 26, 40, 41, 47], "19643": 6, "2490": 6, "2432": 6, "1767": 6, "35292": 6, "4131": 6, "4355": 6, "3053": 6, "56": [6, 20, 23, 24, 26, 30, 31, 33, 34, 40, 42, 47, 51, 53], "32768": [6, 30], "54090": 6, "7795": 6, "6816": 6, "5247": 6, "31": [6, 23, 31, 32, 33, 40, 41, 42, 47, 51, 53], "107742": 6, "15036": 6, "13012": 6, "10022": 6, "213990": 6, "29374": 6, "25440": 6, "19340": 6, "06": [6, 13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 38, 40, 41, 42, 43, 44, 47, 51, 53], "init": [7, 8, 10, 19, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 40, 41, 42, 43, 51, 53, 55], "sparselookuplay": [7, 8, 10, 22], "hierarchical_parameter_serv": [8, 9, 10, 20, 21, 22, 23, 24, 26, 27, 28, 55], "kwarg": [8, 9, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "abbrevi": [8, 9], "implicitli": [8, 24, 41, 55], "ps_config_fil": [8, 9, 12, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 55], "global_batch_s": [8, 9, 20, 21, 22, 23, 24, 26, 27, 32, 33, 55], "constructor": [8, 9, 24], "safe": [8, 32, 41], "implicit": [8, 9, 24, 25], "especi": [8, 55], "cuda_visible_devic": [8, 20, 21, 22, 23, 24, 26, 28, 32, 33, 42, 55], "set_visible_devic": [8, 27, 55], "addition": [8, 44, 55], "visibl": [8, 55], "horovod": [8, 27, 55], "scope": [8, 22, 32, 55], "hvd": [8, 27], "sess": [8, 41], "hps_init": 8, "keyword": 8, "dictionari": [8, 50], "demo_model": [8, 15], "demo_model_spars": 8, "sparse_embedding0": [8, 21, 22, 26, 31, 32, 33], "demo_model2": 8, "demo_model2_sparse_0": 8, "demo_model2_sparse_1": 8, "ok": [8, 41, 48], "wrapper": [9, 12, 24], "embedding_lookup_spars": [9, 10, 21, 22], "table_id": [9, 12, 15, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40], "emb_vec_s": [9, 12, 15, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "emb_vec_dtyp": [9, 20, 21, 22, 23, 24, 26], "sparse_lookup_lay": [9, 21, 22, 26], "def": [9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 46, 47, 51], "_infer_step": [9, 20, 21, 26], "embedding_vector": [9, 20, 24, 26, 27, 30, 32, 33, 51], "sp_id": [9, 21, 22, 26], "sp_weight": [9, 21, 22, 26], "enumer": [9, 20, 21, 22, 24, 26, 27, 28, 33, 40, 41, 46, 47, 51], "max_norm": [9, 55], "op": [9, 24, 30, 31, 32, 33, 42, 50, 51, 55], "canon": 9, "sparsetensor": [9, 21, 22, 26], "aggreg": 9, "int32": [9, 12, 14, 15, 23, 28, 30, 31, 32, 33], "sqrtn": 9, "squar": 9, "root": [9, 19, 25, 29, 30, 34, 35, 42, 43, 47, 48, 53, 55], "clip": [9, 42, 55], "d0": 9, "d1": 9, "self": [9, 10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 38, 41, 43], "3x16": 9, "vector_for_id_1": 9, "vector_for_id_3": 9, "vector_for_id_0": 9, "rais": [9, 27, 40, 41], "typeerror": 9, "neither": 9, "nor": 9, "valueerror": [9, 27], "lookup_lay": [9, 20, 21, 23, 24], "Its": [9, 55], "get_shap": 9, "realiz": [10, 17, 20, 28, 36], "toolkit": [10, 13, 17, 20, 38], "face": 10, "hundr": 10, "gigabyt": 10, "qualiti": 10, "engag": 10, "dozen": 10, "mitig": 10, "volatil": [10, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 55], "tail": [10, 42, 51, 55], "characterist": [10, 30], "hierarchi": 10, "ssd": [10, 18, 55], "subscrib": [10, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "illustr": [10, 36, 55], "sok": [10, 25, 36, 37, 55, 56], "distributedembed": [10, 26], "dissect": 10, "subgraph": 10, "composid": 10, "saver": [10, 26], "dump_to_fil": [10, 26, 27], "sm": [10, 13, 17, 35, 38], "volta": [10, 13, 17, 36, 38], "70": [10, 13, 17, 19, 23, 32, 35, 38, 40, 43, 47, 53], "ture": [10, 13, 17, 36, 38], "amper": [10, 13, 17, 36, 38, 55], "h100": [10, 13, 17, 34, 35, 38], "hopper": [10, 13, 17, 30, 38, 55], "90": [10, 13, 17, 19, 23, 24, 35, 38, 47, 55], "compon": [10, 13, 17, 19, 35, 38, 55], "applic": [10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 41, 42, 46, 47, 48, 53, 55], "portabl": [10, 13, 17, 30, 38], "reproduc": [10, 13, 17, 25, 29, 33, 34, 38, 43], "agnost": [10, 17, 38], "ll": [10, 35, 38, 40, 50, 55], "pull": [10, 13, 17, 19, 35, 38, 48], "rm": [10, 13, 17, 19, 25, 29, 30, 34, 35, 38, 41, 43, 47, 48, 55], "cap": [10, 13, 17, 19, 25, 29, 34, 38, 40, 43], "sys_nic": [10, 13, 17, 19, 25, 29, 34, 38, 43], "python3": [10, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 40, 41, 49], "jupyt": [10, 13, 17, 24, 30, 31, 32, 33, 47, 48, 55], "cover": [10, 30, 41, 46], "migrat": [10, 55], "hps_dlrm_benchmark": [10, 17], "md": [10, 17, 55], "inherit": 12, "modul": [12, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 35, 41, 42, 43, 47, 55], "hps_torch": [12, 13, 28, 29], "__init__": [12, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33], "har": 13, "seamlessli": [13, 55], "catalog": [13, 17, 38], "explor": 13, "visit": [13, 55], "24": [13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 38, 40, 41, 42, 43, 47, 51, 53, 54], "hpsplugin": [14, 16], "registr": [14, 15], "hps_trt": [14, 15, 17, 30, 31, 32, 33, 34], "num_keys_per_sampl": 14, "embedding_vector_s": 14, "hpsplugincr": [14, 15, 16], "registri": 14, "trail": 15, "charact": [15, 21, 24, 26], "np": [15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 47, 48, 49, 50, 51], "pluginfield": 15, "hps_conf": 15, "dtype": [15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 49, 50, 55], "string_": 15, "pluginfieldtyp": 15, "popular": [17, 45], "tf2onnx": [17, 30, 33], "hugectr2onnx": [17, 31, 36, 41, 55], "graphsurgeon": 17, "ld_preload": [17, 24, 30, 31, 32, 33], "usr": [17, 19, 22, 24, 26, 30, 31, 32, 33, 35, 41, 43, 49], "lib": [17, 22, 24, 26, 30, 31, 32, 33, 41, 49], "libhps_plugin": [17, 30, 31, 32, 33], "pytorch": [17, 28, 29, 34, 41, 47, 48], "ctype": [17, 30, 31, 32, 33], "cdll": [17, 30, 31, 32, 33], "rtld_global": [17, 30, 31, 32, 33], "subcompon": 18, "meet": [18, 41], "site": 18, "relationship": [18, 55], "highest": 18, "speed": [18, 30, 33, 36, 40, 55], "benefit": 18, "unifi": [18, 49, 55], "extens": [18, 41, 48, 55], "hugectr_backend": 18, "critic": [19, 20, 21, 22, 23, 24, 26, 30, 33, 41], "hps_profil": 19, "benchmark": [19, 34, 41, 54, 55], "trion": 19, "procedur": [19, 55], "embedding_cach": 19, "num_kei": 19, "p": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 41, 42, 43, 51, 53, 55], "table_s": 19, "630000": 19, "warmup_iter": 19, "900": [19, 28, 40, 41, 51, 53], "000285m": 19, "000384853m": 19, "median": 19, "000365m": 19, "95": [19, 23, 47], "000428m": 19, "99": [19, 23, 47], "000465m": 19, "009736m": 19, "73973e": 19, "010842m": 19, "0117076m": 19, "011596m": 19, "012219m": 19, "016642m": 19, "027379m": 19, "86236": 19, "dedupl": 19, "019159m": 19, "0272492m": 19, "027262m": 19, "028104m": 19, "029548m": 19, "052309m": 19, "36681": 19, "178875m": 19, "231377m": 19, "227815m": 19, "267493m": 19, "284738m": 19, "47672m": 19, "4389": 19, "merg": [19, 30, 35], "007656m": 19, "00850756m": 19, "008434m": 19, "009117m": 19, "011863m": 19, "018697m": 19, "118568": 19, "105163m": 19, "15741m": 19, "153763m": 19, "192302m": 19, "208846m": 19, "402043m": 19, "6503": 19, "52": [19, 23, 31, 40, 41, 47, 51, 53, 55], "021729m": 19, "0227739m": 19, "02253m": 19, "023695m": 19, "025035m": 19, "043024m": 19, "44385": 19, "decompress": 19, "deuniqu": 19, "011247m": 19, "0121274m": 19, "011953m": 19, "013055m": 19, "014706m": 19, "022186m": 19, "83661": 19, "719323": 19, "843972": 19, "854749": 19, "894188": 19, "90276": 19, "918169": 19, "parti": [19, 35, 43, 55], "git": [19, 25, 29, 30, 34, 35, 43, 47, 53], "clone": [19, 30, 35, 47, 53, 55], "cd": [19, 25, 29, 30, 34, 35, 38, 40, 41, 43, 47, 48, 53], "submodul": [19, 35, 43, 53], "recurs": [19, 35, 43, 53], "ngc": [19, 36, 47, 49, 53, 55], "mount": [19, 25, 29, 34, 43, 47], "pwd": [19, 25, 29, 30, 34, 41, 43, 47, 48], "8888": [19, 25, 29, 30, 34, 43], "mkdir": [19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 43, 46, 51, 53], "cmake": [19, 35, 36, 43, 50, 53, 55], "dcmake_build_typ": [19, 35, 43, 53], "dsm": [19, 35, 43, 53, 55], "denable_infer": [19, 30, 35], "ON": [19, 30, 35, 36, 43, 53, 55], "denable_profil": 19, "j": [19, 21, 22, 26, 32, 33, 35, 43, 53], "exit": [19, 41], "hotkei": 19, "histogram": 19, "100000": [19, 22], "hot_key_percentag": 19, "hot_key_coverag": 19, "test": [19, 30, 35, 41, 42, 45, 53, 54, 55], "discard": 19, "database_backend": [19, 55], "vdb": 19, "pdb": 19, "refresh_embeddingcach": 19, "lookup_sess": 19, "e2": 19, "model_sampl": 19, "190813m": 19, "243117m": 19, "238085m": 19, "283761m": 19, "346377m": 19, "511712m": 19, "4200": [19, 51], "075086m": 19, "127312m": 19, "121235m": 19, "166826m": 19, "219295m": 19, "285409m": 19, "8248": 19, "44": [19, 23, 26, 30, 32, 33, 40, 41, 47, 51, 53], "xx": [19, 55], "mutual": [19, 30], "accur": 19, "don": [19, 35, 55], "prepar": [19, 38, 50, 51, 55], "everyth": [19, 55], "tritonserv": [19, 24, 30, 31, 32, 33], "your_model_nam": 19, "perf_output": 19, "csv": [19, 45, 46, 49, 50], "verbos": [19, 24, 30, 32, 35, 55], "your_generated_request": 19, "pipelin": [19, 36, 54, 55], "pofil": 19, "copyright": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "2021": [20, 21, 22, 23, 24, 26, 27, 28, 37, 40, 42, 53], "corpor": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "right": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "licens": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "complianc": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "www": [20, 21, 22, 23, 24, 26, 27, 28, 33, 40, 42, 53], "org": [20, 21, 22, 23, 24, 26, 27, 28, 33, 38, 40, 42, 45, 48, 49, 53, 55], "agre": [20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 41, 42, 53], "AS": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "warranti": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "OR": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 54], "OF": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "languag": [20, 21, 22, 23, 24, 26, 27, 28, 37, 40, 42, 53], "govern": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "permiss": [20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 42, 53], "intend": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "preinstal": [20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 53], "naiv": [20, 23], "neural": [20, 21, 22, 23, 24, 26, 30, 36, 38, 41, 50, 51], "gpu_num": [20, 21, 22, 24, 26, 27, 32, 33], "iter_num": [20, 21, 22, 24, 26, 27, 32, 33], "vocabulary_range_per_slot": [20, 21, 22, 24, 26, 27, 32, 33], "naive_dnn": 20, "dense_model_path": [20, 21, 22, 24, 26, 27], "naive_dnn_dens": 20, "embedding_table_path": [20, 21, 22, 24, 26, 27, 32, 33], "naive_dnn_spars": 20, "saved_path": [20, 21, 22, 24, 26, 27, 33], "naive_dnn_tf_saved_model": 20, "np_key_typ": [20, 21, 22, 24, 26, 27, 32, 33], "np_vector_typ": [20, 21, 22, 24, 26, 27, 32, 33], "tf_key_typ": [20, 21, 22, 23, 24, 26, 27, 33], "tf_vector_typ": [20, 21, 22, 24, 26, 27, 33], "join": [20, 21, 22, 23, 24, 26, 28, 30, 32, 33, 41, 42, 45, 46, 50, 51], "generate_random_sampl": [20, 21, 22, 24, 26, 27, 32, 33], "key_dtyp": [20, 21, 22, 24, 26, 32, 33], "vocab_rang": [20, 21, 22, 23, 24, 26, 28, 32, 33], "keys_per_slot": [20, 21, 24, 32, 33], "randint": [20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33], "tf_dataset": [20, 21, 22, 24, 26, 27, 33], "from_tensor_slic": [20, 21, 22, 24, 26, 27, 33], "drop_remaind": [20, 21, 22, 24, 26, 27, 33], "trainmodel": [20, 21, 24], "init_tensor": [20, 22, 24, 26, 30, 32, 33], "super": [20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33], "initial_valu": [20, 21, 22, 24, 30, 33], "fc_1": [20, 21, 24], "kernel_initi": [20, 21, 23, 24], "ones": [20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "bias_initi": [20, 21, 23, 24], "fc_2": [20, 21, 24], "logit": [20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "learning_r": [20, 21, 22, 24, 26, 27, 33, 36], "loss_fn": [20, 21, 22, 24, 26, 27, 33], "binarycrossentropi": [20, 21, 22, 24, 26, 27, 33], "from_logit": [20, 21, 22, 24, 26], "_train_step": [20, 21, 22, 24, 26, 27, 33], "gradienttap": [20, 21, 22, 24, 26, 27, 33], "tape": [20, 21, 22, 24, 26, 27, 33], "grad": [20, 21, 22, 24, 26, 33], "trainable_vari": [20, 21, 22, 24, 26, 27, 33], "apply_gradi": [20, 21, 22, 24, 26, 27, 33], "zip": [20, 21, 22, 24, 26, 27, 33, 45, 46], "id_tensor": 20, "trained_model": [20, 21, 22, 24, 26, 27, 32, 33], "weights_list": [20, 21, 22, 24, 33], "get_weight": [20, 21, 22, 24, 33], "embedding_weight": [20, 22, 24, 32, 33], "dense_model": [20, 21, 24, 26, 27, 31, 41], "get_lay": [20, 21, 24, 26, 27], "2022": [20, 21, 22, 24, 26, 27, 31, 37, 40, 53, 55], "07": [20, 21, 22, 23, 26, 27, 32, 33, 40, 41, 42, 44, 47, 51, 53], "742983": 20, "platform": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 34, 37, 41, 55], "cpu_feature_guard": [20, 21, 22, 23, 24, 26, 30, 33, 41], "cc": [20, 21, 22, 23, 24, 26, 27, 30, 33, 41], "151": [20, 21, 22, 26], "oneapi": [20, 21, 22, 23, 24, 26, 30], "onednn": [20, 21, 22, 23, 24, 26, 30], "avx2": [20, 21, 22, 26, 41], "fma": [20, 21, 22, 26, 41], "rebuild": [20, 21, 22, 23, 24, 26, 30, 33, 41, 55], "appropri": [20, 21, 22, 23, 24, 26, 30, 33, 41], "present": [20, 21, 22, 24, 30, 33], "track": [20, 21, 22, 24, 30, 33, 41], "strong": [20, 21, 22, 24, 30, 33], "rewritten": [20, 21, 22, 24, 30, 33], "subclass": [20, 21, 22, 24, 30, 33], "_________________________________________________________________": [20, 21, 26], "input_1": [20, 21, 22, 23, 24, 26], "inputlay": [20, 21, 22, 23, 24, 26, 30, 33], "embedding_l": 20, "ookup": 20, "tfoplambda": [20, 21, 22, 23, 24, 26, 30, 33], "48": [20, 21, 23, 26, 30, 32, 33, 40, 41, 47, 51], "12544": [20, 21], "257": [20, 21, 22, 24, 26, 30], "801": [20, 40], "trainabl": [20, 21, 22, 23, 24, 26, 30, 31, 33, 40, 41, 42, 44, 53], "57": [20, 22, 23, 30, 33, 40, 42, 47, 51, 53], "326494": 20, "common_runtim": [20, 21, 22, 23, 24, 26, 33, 41], "gpu_devic": [20, 21, 22, 23, 24, 26, 33, 41], "1525": [20, 21, 22, 26], "replica": [20, 21, 22, 23, 24, 26, 33, 41], "30989": [20, 21, 22, 26], "mb": [20, 21, 22, 23, 24, 26, 33, 41, 50], "tesla": [20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 51, 53], "sxm2": [20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 51, 53], "bu": [20, 21, 22, 23, 24, 26, 33, 40, 41], "0000": [20, 21, 22, 23, 24, 26, 33, 40, 41, 42], "00": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 40, 41, 47, 48, 51, 53], "6136": 20, "6875": 20, "4463": 20, "05712890625": 20, "3192": 20, "029296875": 20, "2180": 20, "40283203125": 20, "1419": 20, "980712890625": 20, "879": [20, 40, 42], "0396728515625": 20, "513": [20, 42], "3021240234375": 20, "272": [20, 31, 41], "9712219238281": 20, "129": 20, "147705078125": 20, "21624755859375": 20, "model_1": [20, 21, 22, 24, 26, 30], "input_2": [20, 21, 22, 23, 24, 26], "compile_metr": [20, 21, 24, 26], "645703": 20, "368": [20, 21, 26, 28, 33, 40, 41], "asset": [20, 21, 24, 26, 30, 33], "readi": [20, 21, 24, 26, 30, 31, 32, 33, 40, 49, 53], "load_model": [20, 21, 23, 24, 26], "create_and_save_inference_graph": [20, 21, 24, 26], "convert_to_sparse_model": [20, 21, 22, 24, 32, 33], "embeddings_weight": [20, 21, 22, 24, 32, 33], "wb": [20, 21, 22, 23, 24, 28, 30, 31, 32, 33, 46, 47, 48, 51], "key_fil": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec_fil": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec": [20, 21, 22, 23, 24, 28, 32, 33, 51], "key_struct": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec_struct": [20, 21, 22, 23, 24, 28, 32, 33, 51], "wa": [20, 21, 22, 23, 24, 26, 30, 35, 36, 40, 42, 43, 50, 53, 54, 55], "model_2": [20, 21, 24], "input_3": [20, 21, 22, 23, 24, 26], "reshape_1": [20, 21, 22, 23, 24], "12801": 20, "necessari": [20, 21, 26, 30, 35, 55], "peek": [20, 21, 26], "writefil": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 40, 41, 42, 51, 53], "inference_with_saved_model": [20, 21, 26], "embedding_vectors_peek": 20, "id_tensors_peek": 20, "pars": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 55], "hctr": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 53, 55], "25": [20, 21, 23, 28, 32, 33, 40, 42, 47, 50, 51, 53], "009": [20, 40], "rk0": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 53, 55], "main": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 40, 41, 42, 50, 53, 55], "010": [20, 40, 53], "db": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "357": 20, "hps_et": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "preallocatedhashmapbackend": [20, 21, 22, 26], "18446744073709551615": [20, 21, 22, 23, 24, 26, 31, 32, 33, 41], "363": [20, 40, 47], "000000": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 49, 51, 53], "405": 20, "23265739": 20, "11092357": 20, "09594781": 20, "16974597": 20, "22555737": 20, "20454781": 20, "22397298": 20, "1229516": 20, "12451896": 20, "21348731": 20, "11943579": 20, "2502464": 20, "5283": 20, "17773": 20, "26371": 20, "5043": 20, "17928": 20, "22941": 20, "5154": 20, "18816": 20, "28670": 20, "9014": 20, "16185": 20, "22256": 20, "9893": 20, "14515": 20, "25771": 20, "5377": 20, "18265": 20, "28063": 20, "hierarchical_parameter_server_demo": [21, 22, 23, 24, 25, 26, 27], "dive": [21, 22, 23, 24, 26, 27, 37], "slot_num_per_t": 21, "embed_vec_size_per_t": 21, "max_vocabulary_size_per_t": 21, "vocabulary_range_per_slot_per_t": 21, "max_nnz_per_slot_per_t": 21, "multi_table_sparse_input_dens": 21, "multi_table_sparse_input": 21, "multi_table_sparse_input_sparse_0": 21, "multi_table_sparse_input_sparse_1": 21, "multi_table_sparse_input_tf_saved_model": 21, "generate_sparse_kei": [21, 22, 26], "max_nnz_per_slot": 21, "max_nnz_of_all_slot": 21, "max_nnz": [21, 22, 26, 27, 55], "sort": [21, 22, 26, 41, 46, 50], "choic": [21, 22, 26, 40], "dense_shap": [21, 22, 26], "generate_dense_kei": 21, "dense_kei": 21, "assert": [21, 23, 28, 47, 55], "sparse_kei": [21, 22, 26, 27], "init_tensors_per_t": 21, "max_nnz_of_all_slots_per_t": 21, "el": 21, "params0": 21, "params1": 21, "input_shap": 21, "fc_3": 21, "embeddings0": 21, "embeddings1": 21, "math": [21, 30, 55], "embedding_weights_per_t": 21, "51": [21, 23, 40, 41, 42, 47, 51, 53], "09": [21, 30, 41, 42, 47, 51, 53], "676041": 21, "271131": 21, "__________________________________________________________________________________________________": [21, 22, 23, 24, 26, 30, 33], "embedding_look": [21, 22, 24, 30, 33], "up_spars": [21, 22], "embedding_looku": [21, 22, 24, 30, 33], "p_spars": [21, 22], "16640": 21, "29": [21, 22, 23, 26, 27, 30, 32, 33, 40, 41, 42, 47, 51, 53], "441": [21, 41, 47], "14588": 21, "11693": 21, "8232": 21, "9658203125": 21, "6276": 21, "9736328125": 21, "4676": 21, "82861328125": 21, "2921": 21, "1875": 21, "1938": 21, "2447509765625": 21, "1093": 21, "598388671875": 21, "616": 21, "3092651367188": 21, "61248779296875": 21, "input_4": [21, 22, 23, 24], "335404": 21, "absl": [21, 24, 26, 33], "_wrapped_model": [21, 24, 26], "args_0": [21, 24, 26], "unsupport": [21, 24, 26], "renam": [21, 24, 26, 50, 55], "args_0_1": [21, 24, 26], "input_5": [21, 23, 24], "input_6": [21, 23, 24], "sparseloo": [21, 22, 26], "kuplay": [21, 22, 26], "reshape_2": [21, 23], "reshape_3": [21, 23], "29441": 21, "args_0_3": [21, 26], "embeddings0_peek": 21, "embeddings1_peek": 21, "inputs_peek": [21, 26], "2nd": [21, 40], "495": 21, "855": [21, 47], "33": [21, 23, 26, 30, 31, 32, 33, 40, 42, 47, 51, 53], "195": [21, 30, 47], "201": [21, 47, 53], "212": [21, 28, 41], "9905": 21, "1750": 21, "4223": 21, "20477": 21, "22119": 21, "23797": 21, "6111": 21, "9122444": 21, "76979905": 21, "7415885": 21, "66938084": 21, "90488005": 21, "7773342": 21, "6368773": 21, "276": [21, 47], "1610": 21, "408": [21, 30, 32, 40, 42, 53], "1884": 21, "678": [21, 28, 47], "1762": 21, "369": [21, 40], "1794": 21, "403": 21, "1216": 21, "909": 21, "1427": 21, "28882617": 21, "41947648": 21, "597903": 21, "37505823": 21, "70420146": 21, "38864705": 21, "32224336": 21, "31987724": 21, "43596342": 21, "5383081": 21, "37384593": 21, "6026224": 21, "dnn_dens": 22, "dnn_spars": 22, "dnn_tf_saved_model": 22, "dense_featur": [22, 24, 26, 27], "astyp": [22, 23, 24, 26, 27, 28, 31, 32, 33, 42, 50], "fc3": [22, 30, 40, 42, 51, 53], "input_cat": [22, 26], "input_dens": [22, 26, 27], "concat_fea": 22, "mirroredstrategi": [22, 55], "_replica_loss": 22, "compute_average_loss": 22, "_reshape_input": 22, "_dataset_fn": 22, "input_context": 22, "replica_batch_s": 22, "get_per_replica_batch_s": 22, "num_input_pipelin": 22, "input_pipeline_id": 22, "distribute_datasets_from_funct": 22, "41": [22, 23, 30, 32, 33, 40, 41, 47, 48, 51, 53], "55": [22, 23, 30, 33, 41, 42, 47, 51, 53], "554588": 22, "606412": 22, "608128": 22, "609468": 22, "0a": [22, 40, 41], "610818": 22, "0b": [22, 40, 41], "160": [22, 31, 47, 51], "170": [22, 31, 32], "175104": 22, "262400": [22, 30], "437": [22, 28, 31, 41, 47], "761": [22, 30], "eagerli": 22, "call_for_each_replica": 22, "experimental_run": 22, "dist": [22, 24, 26, 32, 49], "1082": [22, 26, 40], "userwarn": [22, 26, 42, 50], "binary_crossentropi": [22, 26], "dispatch_target": [22, 26], "batch_all_reduc": 22, "num_pack": 22, "allreduc": 22, "indexedslic": 22, "broadcast": 22, "perreplica": 22, "1950232": 22, "20766959": 22, "2006835": 22, "21188965": 22, "681": [22, 31, 47], "73474": 22, "691": 22, "33826": 22, "588": [22, 40, 42], "15265": 22, "622": [22, 47], "72485": 22, "9260483": 22, "509967": 22, "0374002": 22, "1059036": 22, "002458": 22, "7079678": 22, "333396": 22, "6451607": 22, "_apply_all_reduc": 22, "_all_reduc": 22, "0x7fba4c2dc1f0": 22, "retrac": [22, 33], "trace": [22, 32, 33, 55], "expens": [22, 33], "excess": [22, 33], "pass": [22, 30, 31, 32, 33, 41, 47, 55], "instead": [22, 24, 33, 38, 41, 55], "outsid": [22, 33, 55], "experimental_relax_shap": 22, "relax": 22, "unnecessari": [22, 33, 55], "controlling_retrac": [22, 33], "api_doc": [22, 33], "8326673": 22, "79405844": 22, "85364443": 22, "92679256": 22, "0x7fba4c2dcdc0": 22, "5796976": 22, "54752666": 22, "57471323": 22, "54845804": 22, "61678064": 22, "647662": 22, "6421599": 22, "6278339": 22, "28049487": 22, "2768654": 22, "2943622": 22, "2805586": 22, "2102679": 22, "368755": 22, "4997649": 22, "5143406": 22, "413176": 22, "42411563": 22, "38453132": 22, "4314984": 22, "pretrainedembed": 22, "fc": [22, 23, 47, 54], "new_fc": 22, "train_with_pretrained_embed": 22, "707": [22, 47], "17": [22, 23, 26, 27, 32, 33, 41, 47, 51, 53, 55], "153": 22, "177": [22, 30, 33], "180": [22, 33], "188": [22, 31, 42], "191": [22, 47, 53], "197": 22, "concat_1": [22, 32], "171": [22, 30, 31, 41], "17934436": 22, "17969523": 22, "18917403": 22, "18102707": 22, "7858478": 22, "68311": 22, "66279": 22, "5826445": 22, "7325904": 22, "7331751": 22, "7210605": 22, "7671325": 22, "62144834": 22, "5696643": 22, "5946336": 22, "64713424": 22, "88115656": 22, "9079187": 22, "98161024": 22, "97925556": 22, "6572284": 22, "6304919": 22, "66552734": 22, "6695935": 22, "2002374": 22, "19162768": 22, "1874283": 22, "19209734": 22, "5284709": 22, "6028371": 22, "5635803": 22, "5773235": 22, "74001855": 22, "71915305": 22, "619328": 22, "7890761": 22, "55197906": 22, "5565746": 22, "52792": 22, "6230979": 22, "templat": [23, 38], "emebed": 23, "off": [23, 35, 40, 55], "create_model_for_table_fus": 23, "pytest": [23, 28], "vocab_s": [23, 28], "num_query_kei": [23, 28], "num_it": [23, 28], "list_physical_devic": [23, 27], "set_memory_growth": [23, 27], "set_inter_op_parallelism_thread": 23, "hps_config": [23, 28], "_tabl": [23, 28], "generate_embedding_t": [23, 28], "hugectr_sparse_model": [23, 28, 51], "00025": 23, "set_up_model_fil": [23, 28], "table_nam": [23, 27, 28, 55], "model_file_nam": [23, 28], "concat_embed": 23, "create_savedmodel": 23, "hps_config_json_object": [23, 28], "indent": [23, 28], "outfil": [23, 28], "__name__": [23, 30, 41], "__main__": [23, 30, 32, 41], "2023": [23, 30, 32, 33, 40, 41, 42, 55], "03": [23, 30, 32, 33, 40, 42, 44, 47, 49, 50, 51, 53], "28": [23, 24, 30, 32, 33, 40, 42, 47, 51, 53], "206281": 23, "194": [23, 24, 28, 30], "sse3": [23, 24, 26, 30, 33], "sse4": [23, 24, 26, 30, 33], "avx": [23, 24, 26, 30, 33], "36": [23, 24, 30, 31, 32, 33, 40, 47, 51, 53], "420084": 23, "926162": 23, "1637": 23, "30996": 23, "input_7": [23, 24], "input_8": 23, "embedding_lookup0": 23, "embedding_lookup1": 23, "embedding_lookup2": 23, "embedding_lookup3": 23, "embedding_lookup4": 23, "embedding_lookup5": 23, "embedding_lookup6": 23, "embedding_lookup7": 23, "3328": [23, 32], "reshape_4": 23, "reshape_5": 23, "reshape_6": 23, "reshape_7": 23, "26624": 23, "26625": 23, "625": 23, "38": [23, 30, 31, 32, 33, 41, 47, 51, 53], "079": 23, "use_static_t": [23, 28, 30, 31, 32, 33], "8_tabl": [23, 28], "080": [23, 40], "blank": [23, 24, 28, 30, 31, 32, 33, 41], "547": [23, 40, 47], "table0": [23, 28], "hashmapbackend": [23, 24, 31, 32, 33, 41], "39": [23, 26, 32, 33, 40, 47, 51, 53, 54], "379": [23, 40, 42, 47], "830": 23, "40": [23, 30, 32, 33, 40, 41, 42, 47, 51, 53], "448": 23, "table3": [23, 28], "899": [23, 40, 45], "table4": [23, 28], "934": [23, 40], "table5": [23, 28], "43": [23, 26, 32, 33, 41, 47, 48, 53], "097": [23, 30, 40, 42], "table6": [23, 28], "296": [23, 28, 41, 45, 55], "table7": [23, 28], "297": [23, 47], "306": [23, 45, 53], "469": 23, "470": [23, 47], "ec": [23, 24, 28, 30, 31, 32, 33, 55], "475": [23, 28, 47], "lookupsess": [23, 28, 30, 33, 41], "inputs_seq": [23, 28], "elaps": [23, 28], "918038": 23, "325440": 23, "818316": 23, "756": [23, 28, 40], "hps_database_backend": [23, 28], "html": [23, 24, 28, 30, 31, 32, 33, 41, 48, 50, 55], "292": [23, 40, 53], "fused_embedding0": [23, 28], "80000": 23, "299": [23, 26, 31, 40], "406": [23, 40, 47], "407": [23, 40, 41, 47, 53], "14": [23, 24, 30, 31, 32, 33, 40, 41, 42, 47, 49, 51, 53], "19": [23, 32, 33, 40, 41, 42, 47, 51, 53], "21": [23, 30, 32, 33, 41, 47, 49, 51, 53], "27": [23, 26, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53], "30": [23, 26, 32, 33, 40, 41, 47, 50, 51, 53, 55], "35": [23, 31, 32, 33, 40, 47, 51, 53], "37": [23, 24, 30, 31, 32, 33, 40, 41, 42, 47, 53], "46": [23, 31, 32, 33, 40, 41, 42, 47, 51], "47": [23, 31, 32, 33, 41, 47, 51], "54": [23, 30, 31, 32, 40, 41, 42, 47, 51, 53], "60": [23, 26, 27, 35, 38, 47, 53], "62": [23, 42, 45, 47], "63": [23, 31, 47, 53], "65": [23, 47], "66": [23, 24, 47], "68": [23, 47, 50], "69": [23, 47], "73": [23, 26, 30, 32, 47], "74": [23, 30, 47], "77": [23, 40, 42, 47], "78": [23, 47], "79": [23, 42, 47], "81": [23, 47], "82": [23, 47], "83": [23, 40, 47], "84": [23, 26, 40, 47], "85": [23, 24, 26, 30, 40, 41, 47], "87": [23, 47], "88": [23, 47], "89": [23, 24, 40, 41, 47], "91": [23, 42, 47], "92": [23, 30, 47], "93": [23, 47], "96": [23, 47], "97": [23, 42, 47], "9442901611328125": 23, "hps_tf_triton_dens": 24, "hps_tf_triton": 24, "hps_tf_triton_sparse_0": 24, "hps_tf_triton_tf_saved_model": 24, "requestsdependencywarn": 24, "urllib3": 24, "chardet": 24, "doesn": [24, 42, 55], "concated_featur": 24, "919938": 24, "444040": 24, "1532": 24, "30991": 24, "23296": 24, "553": [24, 30, 40, 47], "10934": 24, "333984375": 24, "9218": 24, "0703125": 24, "7060": 24, "255859375": [24, 33], "5094": 24, "876953125": 24, "3605": 24, "475830078125": 24, "2593": 24, "270751953125": 24, "1741": 24, "0677490234375": 24, "1045": 24, "5091552734375": 24, "541": [24, 30, 40, 47], "4227905273438": 24, "242": [24, 47], "8596649169922": 24, "hps_tf": [24, 25], "model_repo": [24, 30, 31, 32, 33], "triton_model_repo": 24, "23553": 24, "pbtxt": [24, 30, 31, 32, 33], "mv": [24, 26, 27, 30, 31, 32, 33], "tensorflow_savedmodel": 24, "data_typ": [24, 30, 31, 32, 33], "type_int64": 24, "type_fp32": [24, 30, 31, 32, 33], "output_1": [24, 30, 33], "version_polici": 24, "instance_group": [24, 30, 31, 32, 33], "kind_gpu": [24, 30, 31, 32, 33], "tree": [24, 30, 31, 32, 33, 50, 55], "34mmodel_repo": [24, 31, 32, 33], "00m": [24, 31, 32], "34m1": [24, 31, 32, 33], "34mmodel": 24, "34masset": 24, "keras_metadata": 24, "pb": 24, "saved_model": [24, 30, 33], "34mvariabl": 24, "00000": 24, "34mhps_tf_triton_sparse_0": 24, "background": [24, 30, 31, 32, 33, 41, 55], "merlin_hp": 24, "py3": 24, "x86_64": [24, 31, 41], "egg": 24, "libhierarchical_parameter_serv": 24, "curl": 24, "format_non": 24, "is_shape_tensor": 24, "allow_ragged_batch": 24, "label_filenam": 24, "batch_input": 24, "batch_output": 24, "prioriti": [24, 54], "priority_default": 24, "input_pinned_memori": 24, "output_pinned_memori": 24, "gather_kernel_buffer_threshold": 24, "eager_batch": 24, "dynamic_batch": 24, "preferred_batch_s": 24, "max_queue_delay_microsecond": 24, "preserve_ord": 24, "priority_level": 24, "default_priority_level": 24, "priority_queue_polici": 24, "hps_tf_triton_0": 24, "secondary_devic": 24, "profil": [24, 30, 31, 32, 33, 44, 55], "passiv": 24, "host_polici": 24, "default_model_filenam": [24, 30, 31, 32, 33], "cc_model_filenam": 24, "metric_tag": 24, "model_warmup": 24, "tritoncli": [24, 31, 32, 33], "httpclient": [24, 31, 32, 33], "send_inference_request": 24, "num_request": 24, "triton_cli": 24, "inferenceservercli": [24, 31, 32, 33], "is_server_l": 24, "get_model_repository_index": 24, "key_tensor": [24, 41], "dense_tensor": 24, "inferinput": [24, 31, 32, 33], "np_to_triton_dtyp": [24, 31, 32, 33], "set_data_from_numpi": [24, 31, 32, 33], "inferrequestedoutput": [24, 31, 32, 33], "get_respons": [24, 31, 32, 33], "health": 24, "httpsocketpoolrespons": 24, "plain": 24, "post": [24, 54], "bytearrai": 24, "model_vers": [24, 31, 32, 33], "binary_data_s": [24, 31, 32, 33], "fall": 24, "trt_convert": 24, "original_model_path": 24, "new_model_path": 24, "instanti": [24, 50], "trtgraphconverterv2": 24, "input_saved_model_dir": 24, "precision_mod": 24, "trtprecisionmod": 24, "trt_func": 24, "convert_to_tensor": [24, 27], "input_fn": 24, "yield": 24, "output_saved_model_dir": 24, "clear": [24, 30, 32, 33, 50], "prior": [24, 30, 33], "924379": 24, "grappler": 24, "elig": 24, "924537": 24, "single_machin": 24, "928272": 24, "deactiv": 24, "028482": 24, "028568": 24, "061909": 24, "068593": 24, "tf2tensorrt": 24, "trt_optimization_pass": 24, "198": 24, "calibr": 24, "use_calibr": 24, "069761": 24, "952": [24, 40], "noop": 24, "1x": 24, "nonconvert": 24, "deeplearn": 24, "069860": 24, "tf_trt_max_allowed_engin": 24, "minimum_segment_s": 24, "069893": 24, "convert_graph": 24, "799": [24, 30, 40, 47], "candid": 24, "060667": 24, "916": [24, 40], "trtengineop_000_000": 24, "trtengineop": 24, "biasadd": 24, "concatv2": 24, "const": [24, 30, 33, 41], "matmul": [24, 26, 27, 32, 33], "329": [24, 41, 47, 53], "745": [24, 33, 40], "753": [24, 41, 47], "200000": [24, 31, 32, 33], "778": [24, 47], "814": [24, 31, 47], "815": 24, "818078": 24, "104": [24, 28, 42, 47], "818150": 24, "106": [24, 30, 41], "749149": 24, "convert_nod": 24, "1275": 24, "814132": 24, "trt_logger": [24, 30, 31, 32, 33], "defaultlogg": 24, "cpp": [24, 30, 31, 32, 33, 41, 55], "cublaswrapp": 24, "cubla": [24, 30, 31, 32, 33], "817575": 24, "trt_engine_op": 24, "1061": [24, 33], "creation": 24, "817694": 24, "894": [24, 41], "823806": 24, "34m2": 24, "serial": 24, "numba": [24, 30, 33, 42], "select_devic": [24, 30, 33], "close": [24, 30, 33], "rememb": [24, 30, 35], "kill": 24, "again": [24, 30, 55], "simplest": [25, 29, 34, 43], "isol": [25, 29, 34, 43], "repetit": [25, 29, 34, 43], "prefer": [25, 28, 29, 34], "notebookapp": [25, 29, 34, 43, 48], "token": [25, 29, 34, 43, 48], "web": [25, 29, 30, 34, 37, 43, 55], "browser": [25, 29, 30, 34, 43], "aae96ae9387cd28151868fee318c3b3581a2d794f3b25c6b": [25, 29, 34, 43], "hps_multi_table_sparse_input_demo": 25, "hps_pretrained_model_training_demo": 25, "mirror": [25, 55], "sok_to_hps_dlrm_demo": 25, "sparseoperationkit": [25, 26, 27, 55], "hps_table_fusion_demo": 25, "author": [25, 29, 34, 37, 41, 43], "intel": [25, 29, 34, 43, 54], "xeon": [25, 29, 34, 43, 54], "e5": [25, 29, 34, 43, 54], "2698": [25, 29, 34, 43, 54], "v4": [25, 29, 34, 43, 54, 55], "20ghz": [25, 29, 34, 43, 54], "kingslei": [25, 29, 34, 37, 43], "liu": [25, 29, 34, 37, 43], "hierarchicalparameterserv": [26, 27], "sparse_operation_kit_demo": [26, 27, 55], "sparse_operation_kit": [26, 27, 35, 43, 55], "sy": [26, 27, 30, 33, 41, 42, 47, 50], "unit_test": 26, "test_script": 26, "tf2": 26, "260000": [26, 27, 31, 32, 33], "dlrm_dens": [26, 27], "dlrm_spars": [26, 27, 30], "dlrm_tf_saved_model": [26, 27, 33], "plugin_adam": 26, "arch": [26, 27, 32, 33], "out_activ": [26, 27, 32, 33], "secondorderfeatureinteract": [26, 27, 32, 33], "self_interact": [26, 27], "dot_product": [26, 27, 32, 33], "transpose_b": [26, 27, 33], "ones_lik": [26, 27], "linalg": [26, 27], "band_part": [26, 27], "flat_interact": [26, 27, 32, 33], "boolean_mask": [26, 27], "max_vocabulary_size_per_gpu": [26, 55], "arch_bot": [26, 27, 32, 33], "arch_top": [26, 27, 32, 33], "embedding_lay": [26, 27], "bot_nn": [26, 27, 33], "top_nn": [26, 27, 33], "interaction_op": [26, 27, 33], "interaction_out_dim": [26, 27, 32, 33], "els": [26, 27, 40, 41, 42, 47, 49, 51], "reshape_layer1": [26, 27, 33], "dense_x": [26, 27, 32, 33], "concat_featur": [26, 27, 30, 32, 33], "z": [26, 27, 32, 33], "emb_opt": 26, "get_embedding_optim": 26, "dense_opt": [26, 27], "get_dense_optim": 26, "embedding_sav": [26, 27], "load_embedding_valu": 26, "embedding_vari": [26, 27], "other_vari": 26, "split_embedding_variable_from_oth": 26, "emb_grad": 26, "optimizerscop": 26, "experimental_aggregate_gradi": 26, "793169": 26, "152": [26, 42], "323141": 26, "gpu_bfc_alloc": 26, "allow_growth": 26, "tf_force_gpu_allow_growth": 26, "323214": 26, "30997": 26, "078977": 26, "kit_cc": [26, 27], "kit_cc_infra": [26, 27], "src": [26, 27, 41], "107": 26, "local_replica_id": 26, "109": 26, "4287744788": 26, "raw_manag": [26, 27], "132": [26, 30, 53], "embeddingvari": [26, 27], "raw_param": 26, "120": [26, 31, 41, 47], "global_replica_id": 26, "137": [26, 28, 47], "facad": 26, "225": [26, 40, 47], "378": [26, 42, 53], "temporari": 26, "kit_cc_impl": [26, 27], "dumping_funct": [26, 27], "num_total_kei": 26, "total_max_vocabulary_s": 26, "350": 26, "upload": 26, "loop_num": 26, "260": 26, "235": [26, 40], "9379717111587524": 26, "12726": 26, "013671875": 26, "78772735595703": 26, "33247375488281": 26, "48320770263672": 26, "234": [26, 30], "79978942871094": 26, "6663873195648193": 26, "426162719726562": 26, "430748462677002": 26, "768443584442139": 26, "38544": 26, "distributed_embed": 26, "distrib": 26, "4160000": 26, "utedembed": 26, "second_order_feature_interacti": [26, 33], "ion": [26, 33], "second_order_feature_interactio": [26, 33], "127233": 26, "325": [26, 47], "777": [26, 30, 47, 53], "165": 26, "089529": 26, "untrac": [26, 33], "bottom_0_layer_call_fn": [26, 33], "bottom_0_layer_call_and_return_conditional_loss": [26, 33], "bottom_1_layer_call_fn": [26, 33], "bottom_1_layer_call_and_return_conditional_loss": [26, 33], "bottom_2_layer_call_fn": [26, 33], "callabl": [26, 33], "embeddingvariable_kei": [26, 27], "embeddingvariable_valu": [26, 27], "079021": [26, 27], "192": [26, 27, 41], "147": [26, 27, 40, 47], "18360": [26, 27], "rw": [26, 27, 53], "nobodi": [26, 27], "nogroup": [26, 27], "16640000": [26, 27], "jul": [26, 27], "2080000": [26, 27], "911439": 26, "490542": 26, "165777": 26, "043599": 26, "embeddings_peek": 26, "183": [26, 28, 33, 40], "184": 26, "682": 26, "689": 26, "736": [26, 53], "888": [26, 40], "4486": 26, "5745": 26, "255671": 26, "252879": 26, "252045": 26, "145888": 26, "6825647": 26, "6801282": 26, "68074": 26, "68074226": 26, "6818684": 26, "6809397": 26, "3980061": 26, "3981627": 26, "3980992": 26, "78289294": 26, "7833897": 26, "78293324": 26, "78336245": 26, "78305507": 26, "78301686": 26, "880705": 26, "88164043": 26, "88109225": 26, "87982655": 26, "88028604": 26, "88119066": 26, "8650326": 26, "86442304": 26, "86414057": 26, "8642554": 26, "8640611": 26, "8645548": 26, "783202": 26, "78315204": 26, "78240466": 26, "7826805": 26, "78258413": 26, "7824805": 26, "8573375": 26, "85796195": 26, "85979205": 26, "8595341": 26, "85846806": 26, "85798156": 26, "7563881": 26, "7563928": 26, "7564304": 26, "7563316": 26, "7563634": 26, "7564283": 26, "62020814": 26, "6213356": 26, "62018126": 26, "62036": 26, "6201106": 26, "6201722": 26, "85459447": 26, "85330284": 26, "854774": 26, "854769": 26, "8547034": 26, "85447353": 26, "64481944": 26, "6447684": 26, "6449137": 26, "64472693": 26, "64465916": 26, "64503783": 26, "7852191": 26, "78577": 26, "78521436": 26, "7852911": 26, "78544927": 26, "7853453": 26, "6184057": 26, "61849916": 26, "61735946": 26, "61852926": 26, "61921203": 26, "6175788": 26, "7092892": 26, "7092928": 26, "7092843": 26, "70928746": 26, "70928514": 26, "70928574": 26, "6360293": 26, "6360285": 26, "636029": 26, "63602984": 26, "63602865": 26, "63602734": 26, "69062346": 26, "69038725": 26, "690281": 26, "6907744": 26, "6904431": 26, "6903974": 26, "6840397": 26, "684031": 26, "68404853": 26, "6840508": 26, "68404937": 26, "68404216": 26, "7159784": 26, "71973306": 26, "7159706": 26, "7161063": 26, "71603465": 26, "71592766": 26, "67292804": 26, "67351913": 26, "67328465": 26, "67328894": 26, "6733438": 26, "67301095": 26, "68593156": 26, "6859398": 26, "68593466": 26, "6859294": 26, "6859311": 26, "68593705": 26, "72352993": 26, "7230278": 26, "72331727": 26, "72321206": 26, "72359455": 26, "7233958": 26, "60178": 26, "6017275": 26, "60140777": 26, "60140765": 26, "60151523": 26, "6015818": 26, "73245263": 26, "73322636": 26, "7328412": 26, "73278296": 26, "7325789": 26, "7329973": 26, "68950844": 26, "69225705": 26, "6898281": 26, "6889306": 26, "68944615": 26, "69020116": 26, "848309": 26, "84465414": 26, "84872234": 26, "8486877": 26, "84938526": 26, "8492384": 26, "701107": 26, "6997489": 26, "70110285": 26, "700902": 26, "7011098": 26, "70111394": 26, "5723409": 26, "5738345": 26, "5723305": 26, "57233423": 26, "57233775": 26, "572342": 26, "82768726": 26, "82793933": 26, "8282728": 26, "8282294": 26, "82802093": 26, "8280283": 26, "6491487": 26, "64926434": 26, "64963746": 26, "64926565": 26, "64935625": 26, "64957225": 26, "5615084": 26, "56340796": 26, "5635457": 26, "5635438": 26, "5613529": 26, "56135494": 26, "9477315": 26, "94783926": 26, "94776624": 26, "9477597": 26, "9477446": 26, "9477345": 26, "74906373": 26, "7491199": 26, "74906075": 26, "7490612": 26, "7490609": 26, "7490617": 26, "6141995": 26, "6144503": 26, "6139838": 26, "6140719": 26, "6141932": 26, "61409426": 26, "6773844": 26, "67902935": 26, "67736465": 26, "6773715": 26, "6773739": 26, "67744035": 26, "700472": 26, "70258003": 26, "69977176": 26, "70001334": 26, "75941193": 26, "7594471": 26, "75891864": 26, "7593392": 26, "75900066": 26, "75923026": 26, "tf_cpp_min_log_level": 27, "local_batch_s": 27, "1200": [27, 31, 51, 53], "tolist": 27, "sok_backend_typ": 27, "selcet": 27, "hkv": [27, 55], "det": [27, 55], "sparse_model_path": 27, "sok_embedding_table_path": 27, "sok_dlrm_spars": 27, "local_rank": 27, "generate_ragged_tensor_sampl": 27, "embedding_table_s": 27, "lookup_num": 27, "total_indic": 27, "reduce_sum": 27, "raggedtensor": 27, "from_row_length": 27, "total_data": 27, "dynamicvari": [27, 55], "lookup_spars": [27, 55], "sokemblay": 27, "embedding_dim": [27, 51], "var_typ": 27, "table_num": 27, "sok_var": [27, 55], "init_capac": 27, "max_capac": 27, "reshape_layer_list": 27, "sok_reshap": 27, "sok_concat1": 27, "ret_embed": 27, "embed_vec_dim": 27, "embedding_model": 27, "sok_embed": 27, "dense_reshape1": 27, "dense_concat1": 27, "dense_concat2": 27, "input_spars": 27, "sparse_input": 27, "dense_input": [27, 41], "get_embedding_model": 27, "get_embedding_vari": 27, "get_dense_vari": 27, "tmp_var": 27, "sparse_var": 27, "dense_var": 27, "filter_vari": 27, "embedding_load": [27, 55], "opt": [27, 30, 31, 32, 33, 35, 41, 43, 53], "embedding_var": 27, "embedding_dump": [27, 55], "trainer": 27, "distributedgradienttap": 27, "embedding_opt": 27, "optimizerwrapp": [27, 55], "emb_tap": 27, "dense_grad": 27, "embedding_grad": 27, "input_tupl": 27, "dump_model": 27, "du": 28, "lh": 28, "0m": [28, 33, 41, 49], "40m": 28, "multithread": 28, "jit": [28, 33], "fork": [28, 41], "ground": [28, 41], "truth": [28, 41], "modulelist": 28, "keys_list": 28, "annot": 28, "fut": 28, "preds_seq": 28, "preds_seq_gt": 28, "diff": [28, 41], "mse": [28, 41], "05": [28, 30, 31, 42, 44, 45, 46, 47, 49, 51, 53], "836": [28, 40], "839": [28, 47, 53], "use_hctr_cache_implement": [28, 30, 33, 55], "init_ec": [28, 30, 33], "840": [28, 31, 54], "880": [28, 47, 53], "936": 28, "pointer": 28, "975": 28, "018": [28, 33, 40], "041": [28, 40], "059": [28, 40, 42], "070": [28, 40], "088": [28, 40], "113": 28, "123": [28, 40, 41], "167": [28, 30, 41, 47], "196": [28, 31, 47], "210": [28, 34], "223": 28, "239": 28, "252": [28, 41], "284": [28, 40], "307": [28, 45, 47, 53], "319": [28, 40], "336": [28, 30, 53], "360": [28, 47, 53], "390": [28, 40], "409": [28, 40, 42, 53], "446": 28, "453": [28, 41], "515": [28, 30, 47], "535": 28, "560": [28, 47], "580": [28, 40], "597": 28, "606": [28, 40, 53], "615": [28, 40, 47], "624": [28, 33, 47], "632": 28, "668": [28, 40, 47, 53], "695": [28, 47, 53], "712": [28, 53], "725": [28, 47], "740": [28, 53], "768": [28, 40], "783": [28, 31, 40], "794": [28, 40, 47], "821": [28, 47], "844": [28, 47], "861": 28, "890": 28, "920": [28, 31, 47], "929": [28, 41, 42], "938": [28, 41], "957": [28, 31, 47], "979": [28, 40], "006": [28, 40, 53], "016": [28, 40], "027": [28, 40], "037": [28, 40], "046": [28, 40], "056": [28, 40], "064": [28, 33, 41, 42], "085": [28, 42], "095": 28, "110": 28, "125": 28, "136": [28, 47], "163": [28, 40, 47], "173": 28, "231": 28, "249": 28, "250": [28, 40, 41, 47], "10996460914611816": 28, "hps_torch_demo": 29, "plugin_lib_nam": [30, 31, 32, 33], "plugin_handl": [30, 31, 32, 33], "08": [30, 31, 33, 41, 47, 51, 53], "552734": 30, "litemodel": 30, "reduced_embed": 30, "reduce_mean": [30, 41], "keepdim": 30, "numrical_featur": [30, 33], "3fc_light": 30, "embedding_lookup_1": 30, "inputlai": 30, "er": 30, "up_1": 30, "reduce_mean_1": 30, "tfoplam": 30, "bda": 30, "p_1": 30, "141": 30, "145408": 30, "065": 30, "Then": [30, 31, 32, 33, 47, 48], "graphsurgoen": [30, 31, 32, 33], "deeplearningexampl": [30, 47], "quick": [30, 35], "spark": 30, "fast": [30, 50], "verif": 30, "final_output_dir": 30, "frequency_limit": 30, "roughli": 30, "quickli": [30, 50, 55], "haven": 30, "feauture_": 30, "npy": [30, 41], "deploy_path": 30, "hps_model": 30, "memb_vector": 30, "mkei": 30, "light": [30, 36], "enable_pagelock": [30, 33], "577492": 30, "runpi": [30, 33], "runtimewarn": [30, 33], "unpredict": [30, 33], "behaviour": [30, 33], "msg": [30, 33], "462": [30, 47, 53], "protobuf": [30, 33, 55], "extrem": [30, 33, 38], "slow": [30, 33], "1557": [30, 33], "tag": [30, 33, 35, 41, 55], "928": [30, 47], "signatur": [30, 33, 41], "serving_default": [30, 33], "signature_def": [30, 33], "440": [30, 31, 40, 41], "8f8d49": [30, 33], "opset": [30, 33], "459": 30, "fold": [30, 33], "482": [30, 47], "781": [30, 31, 41], "onnx_graphsurgeon": [30, 31, 32, 33], "shape_infer": [30, 31, 32, 33], "import_onnx": [30, 31, 32, 33], "statefulpartitionedcal": [30, 33], "unknown": [30, 32, 33], "hps_node": [30, 32, 33], "attr": [30, 31, 32, 33], "cleanup": [30, 31, 32, 33, 55], "toposort": [30, 31, 32, 33], "export_onnx": [30, 31, 32, 33], "3fc_light_with_hp": 30, "color": 30, "pip": [30, 41, 46, 47, 48, 49, 55], "distinct": 30, "139822124016208": 30, "139821990953120": 30, "unk__6": 30, "logger": [30, 31, 32, 33], "explicit_batch": [30, 31, 32, 33], "networkdefinitioncreationflag": [30, 31, 32, 33], "create_hps_plugin_cr": 30, "trt_version": 30, "__version__": 30, "init_libnvinfer_plugin": 30, "plg_registri": 30, "get_plugin_registri": 30, "plugin_cr": 30, "plugin_creator_list": 30, "hps_plugin_cr": 30, "get_plugin_cr": 30, "build_engine_from_onnx": [30, 31, 32, 33], "onnx_model_path": [30, 31, 32, 33, 41], "builder": [30, 31, 32, 33], "create_network": [30, 31, 32, 33], "onnxpars": [30, 31, 32, 33], "create_builder_config": [30, 31, 32, 33], "builder_config": [30, 31, 32, 33], "rb": [30, 31, 32, 33, 46, 48, 49], "set_flag": 30, "builderflag": [30, 33], "create_optimization_profil": [30, 31, 32, 33], "set_shap": [30, 31, 32, 33], "add_optimization_profil": [30, 31, 32, 33], "build_serialized_network": [30, 31, 32, 33], "serialized_engin": [30, 31, 32, 33], "dynamic_3fc_light": 30, "fout": [30, 31, 32, 33], "memusagechang": [30, 31, 32, 33], "974": [30, 40], "2531": 30, "661": 30, "2943": 30, "735": 30, "lazi": [30, 31, 32, 33, 55], "regist": [30, 31, 32, 33, 46], "plugin_vers": [30, 31, 32, 33], "plugin_namespac": [30, 31, 32, 33], "116": [30, 31, 40, 53], "117": [30, 47], "140": [30, 41], "227": [30, 32, 47], "ktf32": [30, 33], "0088975": 30, "cublaslt": [30, 31, 32, 33, 55], "2952": 30, "12129": 30, "349": [30, 53], "190": 30, "3301": 30, "12319": 30, "against": 30, "persist": [30, 31, 32, 33, 40, 55], "16672": 30, "memusagestat": [30, 31, 32, 33], "1248": 30, "blockassign": [30, 31, 32, 33], "shift": [30, 31, 32, 33], "shiftntopdown": [30, 31, 32, 33], "took": [30, 31, 32, 33], "040758m": 30, "905970176": 30, "905969664": 30, "3302": 30, "12397": 30, "12407": 30, "encount": [30, 55], "affect": [30, 55], "accuraci": [30, 55], "subnorm": 30, "dynamic_3fc_lite_hps_trt": 30, "tensorrt_plan": [30, 31, 32, 33], "type_int32": [30, 31, 32, 33], "mmodel_repo": 30, "pythonpath": 30, "tensorflow2": 30, "dlrm_and_dcnv2": 30, "perf_data": 30, "minut": 30, "finish": [30, 31, 40, 41, 42, 53], "spark2json": 30, "dataset_path": 30, "binary_split_converted_data": 30, "num": [30, 31, 40, 41, 42, 51, 53], "2000000": [30, 42], "grpcinferenceservic": 30, "8001": 30, "httpservic": 30, "8002": 30, "sh": [30, 36, 38, 40, 41], "echo": [30, 41], "bash": [30, 38, 40], "25600": 30, "time_window": 30, "window": 30, "5000": [30, 31, 42, 51, 55], "msec": 30, "20941": 30, "1163": 30, "sec": 30, "851": 30, "standard": [30, 50, 55], "deviat": [30, 50], "1184": 30, "p50": 30, "p90": 30, "922": 30, "p95": 30, "977": 30, "p99": 30, "1190": 30, "846": [30, 41], "recv": 30, "343": 30, "108": [30, 47], "12800": 30, "14135": 30, "785": [30, 31, 40], "143": [30, 47], "1264": 30, "286": [30, 31, 40], "1236": 30, "1340": 30, "1374": 30, "1476": 30, "1258": 30, "1166": 30, "889": [30, 40], "619": [30, 40], "156": [30, 41, 47], "6400": 30, "8116": 30, "450": 30, "826": 30, "2206": [30, 32], "391": [30, 42, 47], "2183": 30, "2321": 30, "2368": 30, "2486": 30, "2199": 30, "118": [30, 47, 53], "2081": 30, "1632": 30, "1173": 30, "3200": [30, 51], "5311": 30, "295": [30, 41, 47], "3377": 30, "3349": 30, "3486": 30, "3530": 30, "3820": 30, "3370": 30, "155": 30, "3215": 30, "2591": 30, "162": [30, 45, 47], "2068": 30, "1600": [30, 51, 53], "3518": 30, "5109": 30, "5068": 30, "5242": 30, "5316": 30, "5741": 30, "5104": 30, "4933": 30, "4134": 30, "138": 30, "3742": 30, "800": [30, 31, 40, 41, 51, 53], "1910": 30, "9412": 30, "9384": 30, "9529": 30, "9581": 30, "10106": 30, "9406": 30, "294": [30, 32, 53], "9112": 30, "7674": 30, "267": 30, "7179": 30, "130": [30, 47], "400": [30, 31, 40, 41, 51, 53], "992": [30, 33], "1033": 30, "18132": 30, "726": 30, "18051": 30, "18257": 30, "18330": 30, "23069": 30, "18125": 30, "1278": 30, "16847": 30, "14999": 30, "476": [30, 40, 47], "14234": 30, "203": [30, 33, 41], "6081": 30, "34878": 30, "34734": 30, "35143": 30, "35288": 30, "40804": 30, "34872": 30, "2584": 30, "32288": 30, "516": [30, 40], "29340": 30, "870": [30, 47], "28111": 30, "270": [30, 31], "253": [30, 40], "053": 30, "71063": 30, "1570": 30, "70749": 30, "71666": 30, "73226": 30, "77979": 30, "71058": 30, "5092": 30, "65966": 30, "60716": 30, "1804": 30, "58482": 30, "333": [30, 40], "argpars": [30, 40, 42, 47], "argumentpars": [30, 40, 42], "glob": [30, 42, 47, 50], "defaultdict": [30, 46], "log_pattern": 30, "inference_benchmark": 30, "cmd_log": 30, "result_log": 30, "extract_result_from_log": 30, "log_path": 30, "job_log_pattern": 30, "readlin": 30, "job_log": 30, "each_job_log": 30, "add_argu": [30, 40, 42], "parse_arg": [30, 40, 42], "perf_result": 30, "idx": [30, 32], "tresult": 30, "prebuilt": 30, "undergo": 30, "soon": 30, "arm": 30, "particular": [30, 35, 50, 55], "yourself": [30, 43], "setup": [30, 35, 43, 55], "contrast": [30, 35], "advis": 30, "slight": 30, "alter": 30, "nvstage": 30, "dockerfil": [30, 35], "ctr": [30, 35, 37, 38, 39, 56], "sed": 30, "duse_huge_pag": 30, "action": [30, 40], "sudo": 30, "180000": 30, "node0": 30, "hugepag": [30, 41], "2048kb": 30, "nr_hugepag": 30, "reus": 30, "accomplish": 30, "suggest": 30, "hctr_src": 30, "chmod": 30, "lab": [30, 47, 48, 55], "predcondit": 30, "outlin": [30, 35], "itself": 30, "data_parquet": [31, 41], "561": [31, 41, 47], "564": [31, 40, 41], "568": [31, 40, 41, 47], "gen_0": [31, 41, 53], "204": [31, 42], "gen_1": [31, 41, 53], "455": 31, "gen_2": [31, 41, 53], "709": 31, "gen_3": [31, 41, 53], "gen_4": [31, 41, 53], "gen_5": [31, 41, 53], "gen_6": [31, 41, 53], "gen_7": [31, 41, 53], "gen_8": [31, 41, 53], "gen_9": [31, 41, 53], "411": [31, 47, 53], "gen_10": [31, 41, 53], "650": [31, 40], "gen_11": [31, 41, 53], "885": [31, 40, 47], "gen_12": [31, 41, 53], "gen_13": [31, 41, 53], "341": [31, 47], "gen_14": [31, 41, 53], "577": [31, 41], "gen_15": [31, 41, 53], "818": 31, "827": 31, "066": [31, 53], "537": [31, 40], "751": [31, 40], "mpi4pi": [31, 40, 41, 42, 43, 51, 53], "0001": [31, 32, 42], "dlrm_hugectr_graph": 31, "dlrm_hugectr": 31, "cuipcopenmemhandle_v2": 31, "gnu": [31, 41], "libcuda": 31, "539": [31, 40], "2950905596": 31, "542": [31, 47], "698": 31, "peer": [31, 40, 41, 42, 51, 53], "all2al": [31, 40, 41, 42, 51, 53, 55], "699": [31, 41, 47], "700": [31, 40, 47, 51, 53], "705": [31, 47], "782": [31, 47], "max_vocabulary_size_per_gpu_": [31, 41, 42, 51, 53], "3413333": 31, "791": [31, 40, 41, 47], "analysi": [31, 40, 41, 42, 51, 53, 55], "795": [31, 40], "772": [31, 40, 41, 47], "gpu0": [31, 41, 42, 51, 53], "warm": [31, 36, 41, 42, 51, 53, 55], "480": [31, 40, 53], "001000": [31, 41, 42, 51, 53], "522": [31, 40, 47], "72017": 31, "693168": [31, 53], "64947": 31, "694016": 31, "600": [31, 40, 41, 51, 53], "60927": 31, "69323": 31, "432": [31, 47], "60078": 31, "693079": 31, "050": [31, 40], "60162": 31, "693134": 31, "206": [31, 41], "498656": 31, "156138": 31, "rank0": [31, 41, 42, 51, 53], "456": [31, 47, 53], "958": [31, 40, 47], "optimz": [31, 41, 42, 51, 53], "514": [31, 40, 47], "555": [31, 47], "693": 31, "694": 31, "823": [31, 42, 47], "414": [31, 40], "dlrm_hugectr0_sparse_1000": 31, "dlrm_hugectr_dense_1000": 31, "dlrm_hugectr_dens": 31, "graph_config": [31, 41], "convert_embed": [31, 41], "unknown_1": 31, "elif": [31, 32, 40], "unknown_2": 31, "dlrm_hugectr_with_hp": 31, "dlrm_with_hp": 31, "262": [31, 41], "1014": 31, "886": [31, 40], "1239": 31, "cuda_module_load": [31, 32], "env": [31, 32, 33, 53], "onnx2trt_util": [31, 32, 33], "377": [31, 32, 40, 47], "down": [31, 32, 33], "812": [31, 47], "813": 31, "189": 31, "239950": 31, "205": [31, 41], "419": [31, 40], "335": [31, 40], "146": 31, "5763": 31, "1314": 31, "5879": 31, "1368": 31, "kfaster_dynamic_shapes_0805": 31, "preview": [31, 55], "34118830080": 31, "20304": 31, "10752": 31, "scratch": [31, 32, 33, 35, 36, 55], "32505856": 31, "4628": 31, "09284m": 31, "48099840": 31, "6321": 31, "1580": 31, "6322": 31, "1590": 31, "ten": [31, 32, 33], "cmdline": [31, 32, 33], "con": [31, 32, 33], "sorrt": [31, 32, 33], "libtriton_tensorrt": [31, 32, 33], "capab": [31, 32, 33], "iliti": [31, 32, 33], "ectori": [31, 32, 33], "bac": [31, 32, 33], "kend": [31, 32, 33], "shutil": [31, 32, 33, 42, 50], "as_numpi": [31, 32, 33], "49642828": 31, "52846366": 31, "99999994": 31, "9999992": 31, "9999905": 31, "dataload": [32, 47], "dlrm_pytorch": 32, "dlrm_pytorch_spars": 32, "onnx_path": 32, "modified_onnx_path": 32, "dlrm_pytorch_with_hp": 32, "tqdm": [32, 46, 47, 48, 51], "tqdmwarn": 32, "iprogress": 32, "ipywidget": [32, 47], "readthedoc": 32, "en": 32, "stabl": 32, "user_instal": 32, "autonotebook": 32, "notebook_tqdm": 32, "sequenti": [32, 47], "add_modul": 32, "_linear_layer_": 32, "_relu_layer_": 32, "inplac": [32, 47, 51], "transpos": 32, "index_select": 32, "from_pretrain": [32, 48], "bot_mlp": 32, "interaction_lay": 32, "top_mlp": 32, "criterion": 32, "bceloss": 32, "x0_iter": 32, "from_numpi": 32, "pin_memori": 32, "drop_last": 32, "x1_iter": 32, "y_iter": 32, "squeez": [32, 33, 47, 48], "zero_grad": 32, "state_dict": [32, 47], "bottom_linear_layer_1": 32, "in_featur": [32, 47], "out_featur": [32, 47], "bottom_relu_layer_1": 32, "bottom_linear_layer_2": 32, "bottom_relu_layer_2": 32, "bottom_linear_layer_3": 32, "bottom_relu_layer_3": 32, "top_linear_layer_1": 32, "479": [32, 33, 40], "top_relu_layer_1": 32, "top_linear_layer_2": 32, "top_relu_layer_2": 32, "top_linear_layer_3": 32, "top_relu_layer_3": 32, "top_linear_layer_4": 32, "top_relu_layer_4": 32, "top_linear_layer_5": 32, "top_relu_layer_5": 32, "1652954816818237": 32, "7626148462295532": 32, "1845550537109375": 32, "7347715497016907": 32, "0786197185516357": 32, "9271171689033508": 32, "7060756683349609": 32, "7490934133529663": 32, "8274499773979187": 32, "7962949275970459": 32, "6947690844535828": 32, "7241608500480652": 32, "7649394869804382": 32, "7043794393539429": 32, "6948238611221313": 32, "7003152370452881": 32, "7330600619316101": 32, "711887001991272": 32, "6917610168457031": 32, "7227296233177185": 32, "7232402563095093": 32, "7025701999664307": 32, "6962350010871887": 32, "7100769281387329": 32, "7159318923950195": 32, "6963521242141724": 32, "7058508396148682": 32, "7144895792007446": 32, "7082542181015015": 32, "6955724954605103": 32, "6997341513633728": 32, "7167338132858276": 32, "6962475776672363": 32, "6955674290657043": 32, "7098587155342102": 32, "6992183327674866": 32, "6928209066390991": 32, "6933107972145081": 32, "697549045085907": 32, "6969214677810669": 32, "6935250163078308": 32, "6948344111442566": 32, "7015650868415833": 32, "6928752660751343": 32, "6936203837394714": 32, "6962599158287048": 32, "6941655278205872": 32, "6939643025398254": 32, "6933950185775757": 32, "6970551013946533": 32, "0014": 32, "9997": 32, "9991": 32, "0004": 32, "0005": 32, "0002": 32, "dummy_kei": 32, "dummy_numerical_featur": 32, "randn": 32, "input_nam": 32, "output_nam": [32, 41], "dynamic_ax": 32, "ipykernel_52545": 32, "1281679600": 32, "tracerwarn": 32, "incorrect": 32, "stride": [32, 47], "requires_grad": 32, "gather_output_0": 32, "onnx_nam": 32, "gemm_output_0": 32, "gemm": [32, 55], "transb": 32, "114": [32, 40, 47, 54], "relu_output_0": 32, "1455": 32, "constant_output_0": 32, "cpulongtyp": 32, "reshape_output_0": 32, "allowzero": 32, "concat_output_0": 32, "3456": 32, "transpose_output_0": 32, "perm": 32, "matmul_output_0": 32, "729": [32, 47], "gather_33": 32, "351": [32, 33, 40], "concat_1_output_0": 32, "268": 32, "1035": 32, "497": 32, "1259": 32, "543": [32, 47], "652": [32, 40], "653": [32, 40, 47, 53], "209": [32, 47], "220": 32, "280": [32, 41], "433": 32, "331": [32, 47, 53], "144": [32, 33, 47], "5771": 32, "933": [32, 40], "115": [32, 40, 47], "5886": 32, "987": [32, 53], "34103362048": 32, "45142016": 32, "011619m": 32, "58774016": 32, "5933": 32, "1043": 32, "5128022": 32, "51312006": 32, "51246136": 32, "5129204": 32, "51302147": 32, "513144": 32, "dlrm_tf": 33, "dlrm_tf_spars": 33, "032517": 33, "963734": 33, "1638": 33, "30974": 33, "171392": 33, "2197505": 33, "897": [33, 47], "578464": 33, "executor": 33, "1209": 33, "abort": 33, "invalid_argu": 33, "_2": 33, "51200": 33, "892396": 33, "xla": 33, "169": [33, 42, 47], "0x55e0fdfeb330": 33, "892450": 33, "streamexecutor": 33, "897903": 33, "mlir": 33, "dump_mlir_util": 33, "269": [33, 47], "crash": [33, 55], "mlir_crash_reproducer_directori": 33, "379151": 33, "stream_executor": 33, "cuda_dnn": 33, "424": [33, 40], "8902": 33, "502058": 33, "device_compil": 33, "lifetim": [33, 55], "_baseoptim": 33, "_update_step_xla": 33, "0x7fa9660adab0": 33, "reduce_retrac": 33, "68028259277344": 33, "2571352064": 33, "639234": 33, "4132346": 33, "20792958": 33, "5957": 33, "8994140625": 33, "231005": 33, "96875": 33, "185315": 33, "3125": 33, "151740": 33, "43695": 33, "6640625": 33, "45556": 33, "24609375": 33, "131654": 33, "78125": 33, "8805829286575317": 33, "49121": 33, "47265625": 33, "60609": 33, "62109375": 33, "676294": 33, "375": [33, 40, 47], "31208": 33, "66015625": 33, "156789": 33, "65625": 33, "103213": 33, "1015625": 33, "394046783447266": 33, "10789": 33, "5703125": 33, "2716": 33, "05859375": 33, "139559": 33, "130419": 33, "13583": 33, "6923828125": 33, "7378": 33, "22802734375": 33, "81185": 33, "40625": 33, "18370": 33, "3314": 33, "90478515625": 33, "15871": 33, "3154296875": 33, "545": [33, 40, 47], "2841796875": 33, "1281": 33, "3038330078125": 33, "52890": 33, "2550": 33, "232177734375": 33, "4526": 33, "03759765625": 33, "5832462310791": 33, "22301483154297": 33, "7525691986084": 33, "034607887268066": 33, "6510401964187622": 33, "275766372680664": 33, "707094430923462": 33, "7623991966247559": 33, "5783321857452393": 33, "8166252374649048": 33, "885994553565979": 33, "912842869758606": 33, "7323049902915955": 33, "7469371557235718": 33, "8475004434585571": 33, "serializ": 33, "get_config": 33, "proper": 33, "248789": 33, "721088": 33, "126": 33, "926": [33, 47], "868": [33, 40, 41, 47], "302": [33, 41, 47, 55], "255": [33, 41, 47, 53], "04": [33, 42, 44, 45, 47, 50, 51, 53], "unsqueez": [33, 47], "dlrm_tf_with_hp": 33, "2013": 33, "4018": 33, "721": 33, "421": [33, 40], "4516": 33, "793": [33, 40, 47], "374": 33, "774": [33, 47], "fp8_quant": [33, 55], "775": 33, "860": [33, 40, 47], "863": 33, "864": 33, "869": [33, 40, 42, 47], "902": [33, 42], "947": [33, 40, 41], "51968": 33, "047": [33, 40], "069": [33, 40, 42], "077": 33, "034216": 33, "8710": 33, "1051": 33, "8711": 33, "18350080": 33, "007954m": 33, "31981568": 33, "8764": 33, "1091": 33, "1101": 33, "00mdlrm_tf_with_hp": 33, "00mconfig": 33, "tritonbackend_modelinstanceiniti": 33, "dlrm_tf_with_hps_0": 33, "34091672": 33, "demo_for_pytorch_trained_model": 34, "demo_for_hugectr_trained_model": 34, "instal": [34, 35, 41, 43, 46, 47, 48, 49, 50, 53, 55], "benchmark_tf_trained_large_model": 34, "147gb": [34, 55], "interconnect": 34, "bz": 34, "2tb": 34, "gen4": 34, "1396": [34, 41], "sxm5": 34, "platinum": 34, "8480c": 34, "gen5": 34, "773": [34, 40, 41, 47], "nvl": 34, "94gb": 34, "grace": [34, 55], "480gb": 34, "c2c": 34, "grate": 35, "interest": 35, "submit": [35, 54], "bug": [35, 55], "review": [35, 44], "think": 35, "priorit": 35, "comment": [35, 55], "propos": 35, "ahead": [35, 55], "pend": [35, 55], "forget": 35, "properli": [35, 41, 55], "ask": 35, "approv": 35, "clarif": [35, 55], "hesit": 35, "promptli": 35, "contributor": [35, 38, 55], "journei": 35, "1007": 35, "56a762eae3f8": 35, "dst_imag": 35, "docker_fil": 35, "rmm_ver": 35, "vnightli": 35, "cudf_ver": 35, "nvtab_ver": 35, "hugectr_dev_mod": 35, "cli": [35, 41], "varnam": 35, "quiet": 35, "suppress": [35, 55], "devel": 35, "cmake_build_typ": 35, "eval_batch": [35, 55], "enable_multinod": [35, 43], "enable_infer": 35, "enable_hdf": 35, "AND": 35, "enable_s3": [35, 53], "amazon": [35, 55], "sdk": [35, 53], "skk": 35, "denable_hdf": [35, 36], "denable_s3": [35, 53], "denable_multinod": [35, 43], "cmake_install_prefix": [35, 43, 55], "dcmake_install_prefix": [35, 43], "devel_infer": 35, "full": [36, 40, 46, 55], "varieti": 36, "8xa100": 36, "localizedslotembeddinghash": 36, "aren": 36, "distributedslotembeddinghash": 36, "localizedslotembeddingonehot": 36, "gender": 36, "wouldn": 36, "easi": [36, 55], "openmpi": 36, "gpudirect": 36, "dcn_2node_8gpu": 36, "footprint": 36, "tensorcor": 36, "mixed_precis": 36, "arithmet": 36, "underflow": 36, "exchang": [36, 54], "onnx_convert": [36, 41, 55], "hugectr2onnx_demo": 36, "ofembed": 36, "thing": 36, "redund": 36, "novelgpu": 36, "forintegr": 36, "hugectr_wdl_predict": 36, "hierrach": 36, "difficult": 36, "confer": 37, "websit": [37, 39], "titl": [37, 45], "date": 37, "speaker": 37, "video": [37, 44], "episod": 37, "\u52a0\u901f\u7684\u63a8\u8350\u7cfb\u7edf\u6846\u67b6": 37, "joei": 37, "wang": 37, "\u4e2d\u6587": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u5982\u4f55\u52a0\u901f\u63a8\u7406": 37, "\u4f7f\u7528": 37, "\u52a0\u901f": 37, "\u8bad\u7ec3": 37, "gem": 37, "guo": 37, "gtc": 37, "sping": 37, "march": 37, "matthia": [37, 43], "langer": [37, 43], "yingcan": [37, 43], "wei": [37, 43], "yu": 37, "fan": [37, 40], "english": 37, "apsara": 37, "\u63a8\u8350\u7cfb\u7edf": 37, "oct": 37, "spring": 37, "tencent": 37, "advertis": [37, 55], "april": 37, "xiangt": 37, "kong": 37, "Into": 37, "minseok": 37, "lee": 37, "jianb": 37, "dong": 37, "china": 37, "2020": [37, 53], "\u6df1\u5165\u7814\u7a76\u6027\u80fd\u4f18\u5316": 37, "\u6027\u80fd\u63d0\u5347": 37, "\u500d": 37, "\u7684\u9ad8\u6027\u80fd": 37, "\u5e7f\u544a\u63a8\u8350\u52a0\u901f\u7cfb\u7edf\u7684\u843d\u5730\u5b9e\u73b0": 37, "\u63a8\u7406\u8fc7\u7a0b": 37, "\u5c06": 37, "\u96c6\u6210\u4e8e": 37, "estim": [37, 38, 39, 55, 56], "2019": 37, "\u52a0\u901f\u7684\u63a8\u8350\u7cfb\u7edf\u8bad\u7ec3": 37, "wechat": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e09": 37, "\u96c6\u6210\u5230tensorflow": 37, "nov": 37, "devblog": 37, "\u5206\u5c42\u53c2\u6570\u670d\u52a1\u5668\u6269\u5c55\u63a8\u8350\u7cfb\u7edf\u63a8\u7406": 37, "august": 37, "shashank": 37, "verma": 37, "wenwen": 37, "gao": 37, "jerri": [37, 43], "shi": [37, 43], "kit": [37, 43, 55], "\u7cfb\u5217\u4e4b\u4e8c": 37, "june": 37, "kunlun": 37, "li": 37, "\u7cfb\u5217\u4e4b\u4e00": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e8c": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e00": 37, "jan": 37, "sept": 37, "vinh": [37, 43], "nguyen": [37, 43], "ann": 37, "spencer": 37, "meituan": 37, "interview": 37, "jun": [37, 40], "huang": 37, "sheng": 37, "luo": 37, "benedikt": 37, "schiffer": 37, "\u6269\u5c55\u548c\u52a0\u901f\u5927\u578b\u6df1\u5ea6\u5b66\u4e60\u63a8\u8350\u7cfb\u7edf": 37, "\u7cfb\u5217\u7b2c": 37, "\u90e8\u5206": 37, "\u7684": 37, "\u8bad\u7ec3\u5927\u578b\u6df1\u5ea6\u5b66\u4e60\u63a8\u8350\u6a21\u578b": 37, "ashish": 37, "sardana": 37, "ir": 37, "aug": 37, "oldridg": 37, "juli": 37, "massiv": [38, 55], "bottleneck": [38, 47], "record": [38, 42, 55], "homogen": 38, "easier": [38, 55], "sign": 38, "advanc": 38, "p100": 38, "pascal": 38, "team": [38, 55], "research": 38, "dcn_norm_generate_train": 38, "wdl_norm_generate_train": 38, "dlrm_raw_generate_train": 38, "dcn_parquet_generate_train": 38, "criteo_data": [38, 40], "panda": [38, 40, 41, 45, 46, 49, 51, 55], "introduct": [39, 55], "overarch": 39, "bring": 39, "cell": [40, 41, 43], "shell": 40, "softlink": 40, "kaggl": [40, 55], "occurr": 40, "postfix": [40, 50], "day_1": 40, "wdl_data": 40, "3rd": 40, "4th": 40, "embodi": 40, "5th": 40, "6th": 40, "soft": [40, 42], "project_root": 40, "home": 40, "wget": [40, 41, 42, 46], "cail": [40, 42], "day_0": [40, 42], "gz": [40, 41, 42], "deepfm_data_nvt": 40, "nvt": [40, 42, 50, 51], "ln": [40, 41, 42], "smi": 40, "460": [40, 47], "disp": 40, "uncorr": 40, "ecc": 40, "temp": [40, 42], "perf": [40, 55], "pwr": 40, "mig": 40, "00000000": 40, "33c": 40, "p0": 40, "42w": 40, "300w": 40, "0mib": 40, "16160mib": 40, "35c": 40, "45w": 40, "36c": 40, "44w": 40, "8a": [40, 41], "34c": 40, "41w": 40, "gi": 40, "ci": 40, "pid": 40, "dlrm_train": [40, 55], "use_dynamic_hash_t": 40, "shard_plan": 40, "round_robin": 40, "store_tru": 40, "generate_shard_plan": 40, "target_gpu": 40, "gpu_id": 40, "mp_tabl": 40, "6000": [40, 42], "dp_tabl": 40, "use_embedding_collect": 40, "num_embed": 40, "ebc": 40, "emb_vec_list": 40, "emb_vec": 40, "relu3": [40, 53], "relu4": [40, 53], "fc5": [40, 53], "relu5": [40, 53], "fc6": [40, 53], "relu6": [40, 53], "fc7": [40, 53], "relu7": [40, 53], "fc8": [40, 53], "3508545476": 40, "637": 40, "4714": 40, "4441": 40, "609": [40, 53], "5378": 40, "5339": 40, "4636": 40, "4480": 40, "4949": 40, "5183": 40, "789": [40, 53], "790": 40, "792": [40, 41], "919": [40, 42], "max_row_group_s": [40, 41, 42], "133678": 40, "022": 40, "134102": 40, "029": 40, "0804": 40, "0457": 40, "030": 40, "0183": 40, "032": 40, "1121": 40, "033": 40, "035": 40, "0378": 40, "0222": 40, "038": 40, "0691": 40, "039": 40, "0925": 40, "9636": 40, "043": 40, "9363": 40, "044": 40, "0300": 40, "0261": 40, "9558": 40, "049": 40, "9402": 40, "9871": 40, "052": 40, "0105": 40, "6863": 40, "224": [40, 47], "6589": 40, "330": 40, "7527": 40, "474": 40, "7488": 40, "6785": 40, "646": 40, "6628": 40, "755": [40, 53], "7097": 40, "7332": 40, "040": 40, "4089": 40, "175": [40, 47], "3816": 40, "4753": 40, "467": [40, 47, 53], "617": [40, 47, 54], "4011": 40, "3855": 40, "921": 40, "4324": 40, "063": [40, 42], "4558": 40, "221": 40, "1016": 40, "7546": 40, "7253": 40, "410": [40, 47, 53], "8425": 40, "412": [40, 42, 53], "8308": 40, "413": [40, 41, 42, 47, 53], "7957": 40, "9031": 40, "415": [40, 53], "9578": 40, "417": 40, "6531": 40, "418": 40, "6238": 40, "420": [40, 47], "8386": 40, "7410": 40, "422": 40, "7292": 40, "6941": 40, "425": [40, 42], "8015": 40, "426": 40, "8562": 40, "558": [40, 47], "4051": 40, "1921": 40, "567": [40, 41], "1628": 40, "570": [40, 47], "3777": 40, "573": 40, "2800": [40, 51], "576": 40, "2683": 40, "579": 40, "2332": 40, "582": 40, "3406": 40, "585": 40, "3953": 40, "587": [40, 47], "0088": [40, 41], "1824": 40, "1531": 40, "589": [40, 41], "3679": 40, "590": [40, 47], "2703": 40, "591": 40, "2585": 40, "592": 40, "2234": 40, "593": 40, "3308": 40, "595": [40, 47], "457": 40, "data0": 40, "data3": 40, "data4": 40, "data5": 40, "data6": 40, "data7": 40, "data8": 40, "data9": 40, "data10": 40, "data11": 40, "data12": 40, "data13": 40, "data14": 40, "data15": 40, "data16": 40, "data17": 40, "data18": 40, "data19": 40, "data20": 40, "data21": 40, "data22": 40, "data23": 40, "data24": 40, "data25": 40, "embeddingcollection0": 40, "emb_vec0": 40, "emb_vec1": 40, "emb_vec2": 40, "emb_vec3": 40, "emb_vec4": 40, "emb_vec5": 40, "emb_vec6": 40, "emb_vec7": 40, "emb_vec8": 40, "emb_vec9": 40, "emb_vec10": 40, "emb_vec11": 40, "emb_vec12": 40, "emb_vec13": 40, "emb_vec14": 40, "emb_vec15": 40, "emb_vec16": 40, "emb_vec17": 40, "emb_vec18": 40, "emb_vec19": 40, "emb_vec20": 40, "emb_vec21": 40, "emb_vec22": 40, "emb_vec23": 40, "emb_vec24": 40, "emb_vec25": 40, "500000": [40, 41], "458": 40, "14373": 40, "24478": 40, "697": [40, 47], "23782": 40, "142604": 40, "168333": 40, "865": 40, "142137": 40, "25698": 40, "19912": 40, "142685": 40, "1404": 40, "24589": 40, "18021": 40, "143021": 40, "211": [40, 42], "139695": 40, "25073": 40, "245": 40, "16407": 40, "141111": 40, "13893": 40, "24958": 40, "17112": 40, "141069": 40, "138218": 40, "25123": 40, "18422": 40, "135439": 40, "759": 40, "137244": 40, "25471": 40, "803": [40, 53], "19334": 40, "139792": 40, "136812": 40, "2416": 40, "17574": 40, "140519": 40, "135968": 40, "25386": 40, "18238": 40, "134846": 40, "291": [40, 55], "134873": 40, "23619": 40, "3445591887": 40, "383": 40, "384": [40, 47], "385": [40, 42, 47], "386": 40, "628": 40, "643": [40, 41, 47], "651": [40, 47], "654": 40, "939": [40, 41], "946": [40, 41, 47], "997": 40, "0258": 40, "0417": 40, "0144": 40, "011": [40, 41, 42, 53], "1042": 40, "015": 40, "0339": 40, "020": 40, "024": [40, 41], "0652": 40, "0886": [40, 41], "071": 40, "075": [40, 42], "9285": 40, "084": 40, "9480": 40, "092": [40, 41], "9324": 40, "9792": [40, 42], "101": 40, "0027": 40, "332": [40, 55], "9753": 40, "746": 40, "748": [40, 47], "749": 40, "9675": 40, "752": 40, "9519": 40, "9988": 40, "757": 40, "8738": 40, "8464": 40, "760": 40, "762": [40, 47, 53], "763": 40, "8660": 40, "765": [40, 47], "8503": 40, "767": 40, "8972": 40, "9207": 40, "911": 40, "917": 40, "4128": 40, "924": 40, "4792": 40, "930": 40, "4050": 40, "3894": 40, "937": [40, 41, 47], "4363": 40, "940": [40, 41], "4597": 40, "941": [40, 41], "4031": 40, "942": [40, 47], "3757": 40, "944": [40, 47], "4695": 40, "945": [40, 47], "4656": 40, "3796": 40, "948": [40, 47], "4265": 40, "950": [40, 47], "4500": [40, 51], "841": [40, 47], "842": [40, 47], "251": [40, 53], "143524": 40, "34586": 40, "345": [40, 47], "48449": 40, "142247": 40, "657": 40, "141641": 40, "33134": 40, "40384": 40, "142243": 40, "139913": 40, "33118": 40, "161": 40, "40793": 40, "142713": 40, "138901": 40, "34956": 40, "40618": 40, "140238": 40, "883": 40, "138208": 40, "34071": 40, "38745": 40, "140117": 40, "326": 40, "137638": 40, "34076": 40, "42352": 40, "135055": 40, "727": [40, 47, 53], "137268": 40, "728": 40, "33588": 40, "819": [40, 53], "38619": 40, "139783": 40, "193": 40, "136816": 40, "3762": 40, "43341": 40, "140772": 40, "581": [40, 47], "136368": 40, "3521": 40, "673": 40, "41807": 40, "135264": 40, "985": 40, "135726": 40, "34242": 40, "198655838": 40, "517": 40, "730": [40, 47], "731": 40, "732": 40, "896": 40, "907": 40, "913": [40, 47], "914": 40, "915": [40, 47], "969": 40, "002": 40, "004": 40, "005": [40, 53], "007": [40, 53], "008": [40, 53], "012": 40, "013": 40, "014": 40, "017": 40, "021": 40, "023": 40, "025": 40, "081": 40, "121": [40, 41], "423": [40, 41, 47], "505": [40, 53], "145": 40, "559": [40, 42, 47], "747": [40, 47], "275": 40, "091": [40, 42], "133": [40, 42], "361": [40, 42, 53], "0203": 40, "364": [40, 42, 55], "365": [40, 41, 42, 53], "0515": 40, "367": 40, "9460": 40, "0046": 40, "9890": 40, "371": [40, 47], "1355": 40, "372": 40, "8269": 40, "373": [40, 47], "9187": 40, "376": 40, "9500": 40, "8445": 40, "8875": 40, "3660": 40, "525": [40, 47], "4578": 40, "528": 40, "531": [40, 53], "4890": 40, "3835": 40, "538": 40, "4421": 40, "544": [40, 42, 47], "5730": 40, "3562": 40, "546": [40, 47], "548": [40, 47], "550": [40, 47], "3738": 40, "552": [40, 47], "4167": 40, "5632": 40, "594": 40, "599": 40, "144991": 40, "22035": 40, "633": [40, 47], "03885": 40, "144124": 40, "144851": 40, "1863": 40, "98102": 40, "145444": 40, "540": 40, "141821": 40, "18638": 40, "96441": 40, "144249": 40, "139519": 40, "18203": 40, "556": [40, 41, 47], "97548": 40, "140895": 40, "490": 40, "13942": 40, "491": 40, "19363": 40, "533": 40, "97628": 40, "141202": 40, "465": [40, 47], "13947": 40, "18342": 40, "97817": 40, "136504": 40, "138534": 40, "19586": 40, "96355": 40, "14067": 40, "138213": 40, "20188": 40, "98811": 40, "142139": 40, "138044": 40, "19324": 40, "427": [40, 47, 50], "96149": 40, "136835": 40, "137419": 40, "18732": 40, "grow": [40, 55], "1217153067": 40, "506": 40, "485": [40, 41, 47], "486": 40, "662": 40, "669": 40, "670": 40, "671": [40, 42, 47], "672": [40, 47], "862": [40, 49], "866": [40, 47], "871": 40, "872": [40, 53], "873": [40, 41, 42], "875": [40, 53], "876": 40, "878": 40, "881": 40, "882": 40, "884": [40, 47], "949": 40, "055": 40, "157": [40, 47], "780": [40, 53], "953": [40, 47], "150": [40, 41, 53], "434": [40, 47], "786": 40, "8152": 40, "787": 40, "7878": 40, "9441": 40, "8699": 40, "8542": 40, "9011": 40, "9246": 40, "797": 40, "7136": 40, "798": 40, "802": [40, 47], "7683": 40, "805": [40, 47], "7996": 40, "806": [40, 47], "8230": 40, "2527": 40, "943": [40, 47], "2253": 40, "3074": 40, "955": [40, 47], "2917": 40, "3386": 40, "961": 40, "3621": 40, "962": [40, 41], "2429": 40, "964": 40, "2156": 40, "965": 40, "3718": 40, "966": [40, 47], "967": [40, 42, 47], "2976": 40, "968": 40, "2820": 40, "3289": 40, "970": 40, "3523": [40, 42], "859": 40, "static_map": 40, "553648128": 40, "142151": 40, "53912": 40, "26107": 40, "141023": 40, "141078": 40, "57008": 40, "10267": 40, "141925": 40, "309": [40, 47, 53], "140561": 40, "55499": 40, "362": [40, 42, 47, 55], "13614": 40, "14338": 40, "139972": 40, "54929": 40, "464": 40, "10246": 40, "141379": 40, "139553": 40, "56729": 40, "11698": 40, "141421": 40, "642": [40, 41], "139362": 40, "56153": 40, "696": 40, "11376": 40, "136499": 40, "138972": 40, "60721": 40, "811": 40, "11548": 40, "141355": 40, "138726": 40, "56329": 40, "10124": 40, "142614": 40, "139617": 40, "5483": 40, "14957": 40, "138442": 40, "138159": 40, "57499": 40, "ensembl": [41, 43, 55], "inferenceon": 41, "739": 41, "638": 41, "715": 41, "986": 41, "142": 41, "218": 41, "hps_demo": [41, 43], "reshape2": [41, 42, 51], "1100": [41, 51, 53], "ground_truth": 41, "2598678435": 41, "565": 41, "566": 41, "636": 41, "808": 41, "810": 41, "21845": 41, "0047": 41, "6921": 41, "0092": 41, "6824": 41, "207": [41, 47], "208": 41, "213": 41, "658": [41, 47], "444961": 41, "693355": 41, "508793": 41, "694358": 41, "422282": 41, "695494": 41, "764": 41, "175263": 41, "691037": 41, "174492": 41, "688767": 41, "503806": 41, "000913": 41, "093": [41, 42], "148": 41, "279": 41, "hps_demo_with_embed": 41, "hps_demo_dense_1000": 41, "sparse_model": [41, 55], "hps_demo0_sparse_1000": 41, "hps_demo1_sparse_1000": 41, "hps_demo_without_embed": 41, "parameterserverconfig": 41, "pd": [41, 45, 46, 49, 51], "onnxruntim": 41, "ort": 41, "key_offset": 41, "cumsum": 41, "ps_config": 41, "emb_table_nam": 41, "max_feature_num_per_sample_per_emb_t": 41, "inference_params_arrai": 41, "df": [41, 50, 53], "read_parquet": [41, 50, 51], "dense_input_column": 41, "cat_input1_column": 41, "cat_input2_column": 41, "loc": [41, 51], "to_numpi": 41, "cat_input1": 41, "cat_input2": 41, "embedding1": 41, "flatten": 41, "embedding2": 41, "get_output": 41, "input_fe": 41, "get_input": 41, "sess_ref": 41, "res_ref": 41, "pred_ref": 41, "diff_ref": 41, "mse_ref": 41, "18488": 41, "18470": 41, "4895492": 41, "509022": 41, "38192913": 41, "5264926": 41, "50650454": 41, "47927693": 41, "48954916": 41, "50902206": 41, "38192907": 41, "52649266": 41, "5065045": 41, "4792769": 41, "3887142e": 41, "566238532": 41, "3543": 41, "cleanunusedinitializersandnodearg": 41, "key_to_indice_hash_all_t": 41, "lookup_fromdlpack": [41, 55], "capsul": [41, 55], "to_dlpack": 41, "key_capsul": 41, "out_capsul": 41, "out_put": 41, "from_dlpack": 41, "runtimeerror": 41, "cuda_devic": 41, "is_avail": [41, 42], "10028": 41, "10004": 41, "0307": 41, "0264": 41, "0294": 41, "0151": 41, "0281": 41, "eager": 41, "out_tensor": 41, "out_dlcapsul": 41, "729218": 41, "182": [41, 42], "168630": 41, "1639": 41, "30048": 41, "170043": 41, "30184": 41, "171618": 41, "173095": 41, "174795": 41, "176299": 41, "177782": 41, "179411": 41, "20005": 41, "30047": 41, "20004": 41, "30001": 41, "20037": 41, "02182689": 41, "01806355": 41, "01985828": 41, "0136845": 41, "01738386": 41, "00323257": 41, "unix": 41, "primari": [41, 55], "secondari": 41, "multi_process_hp": 41, "multiprocess": [41, 46], "create_hp": 41, "num_max_process": 41, "subprocess": [41, 46], "getpid": 41, "await": 41, "sleep": 41, "eras": 41, "lost": 41, "delet": [41, 55], "revok": 41, "preserv": 41, "risidu": 41, "monitor": 41, "counter": 41, "destroi": 41, "far": 41, "1394": 41, "1397": 41, "270453215232": 41, "269706559488": 41, "17179868672": 41, "313": 41, "multiprocesshashmapbackend": [41, 55], "289": [41, 47, 53], "311": [41, 53], "281": 41, "282": 41, "260310085632": 41, "7783505728": 41, "463": [41, 47], "706": 41, "711": [41, 53], "842594773": 41, "3887142264200634e": 41, "497305659": 41, "101124718": 41, "176": [41, 42], "687": 41, "detach": [41, 47, 48], "progress": [41, 55], "mock": 41, "tar": [41, 47], "archiv": [41, 50], "rf": 41, "xf": 41, "sf": 41, "112": [41, 47], "443": 41, "sent": 41, "codeload": 41, "ref": 41, "gzip": [41, 42], "87m": 41, "50mb": 41, "3011655": 41, "tmr": 41, "mkreleasehdr": 41, "broken": [41, 55], "pipe": 41, "34mcc": 41, "33mmakefil": 41, "dep": 41, "sentinel": 41, "gcda": 41, "gcno": 41, "gcov": 41, "lcov": 41, "makefil": 41, "adlist": 41, "quicklist": 41, "ae": 41, "anet": 41, "sd": 41, "zmalloc": 41, "lzf_c": 41, "lzf_d": 41, "pqsort": 41, "zipmap": 41, "sha1": 41, "ziplist": 41, "replic": 41, "t_string": 41, "t_list": 41, "t_set": 41, "t_zset": 41, "t_hash": 41, "pubsub": 41, "intset": 41, "syncio": 41, "crc16": 41, "endianconv": 41, "slowlog": 41, "bio": 41, "rio": 41, "rand": [41, 49], "memtest": 41, "syscheck": 41, "crcspeed": 41, "crc64": 41, "bitop": 41, "notifi": 41, "setproctitl": 41, "hyperloglog": 41, "sparklin": 41, "geo": 41, "lazyfre": 41, "expir": 41, "geohash": 41, "geohash_help": 41, "childinfo": 41, "defrag": 41, "siphash": 41, "rax": 41, "t_stream": 41, "listpack": 41, "localtim": 41, "lolwut": 41, "lolwut5": 41, "lolwut6": 41, "acl": 41, "sha256": 41, "timeout": 41, "setcpuaffin": 41, "monoton": 41, "mt19937": 41, "resp_pars": 41, "call_repli": 41, "script_lua": 41, "function_lua": 41, "redisassert": 41, "cli_common": 41, "distclean": 41, "clean": [41, 42, 50, 55], "linenois": 41, "lua": 41, "jemalloc": 41, "hdr_histogram": 41, "leav": 41, "xo": 41, "commandfilt": 41, "testrdb": 41, "infotest": 41, "misc": 41, "hook": 41, "blockonkei": 41, "blockonbackground": 41, "scan": 41, "datatype2": 41, "auth": 41, "keyspace_ev": 41, "blockedcli": 41, "getkei": 41, "getchannel": 41, "test_lazyfre": 41, "defragtest": 41, "keyspec": 41, "zset": 41, "mallocs": 41, "aclcheck": 41, "subcommand": 41, "repli": 41, "cmdintrospect": 41, "eventloop": 41, "moduleconfig": 41, "moduleconfigstwo": 41, "usercal": 41, "pedant": 41, "dredis_stat": 41, "c11": [41, 53], "wall": [41, 50], "wno": 41, "o2": 41, "malloc": 41, "build_tl": 41, "use_systemd": 41, "cflag": 41, "ldflag": 41, "redis_cflag": 41, "redis_ldflag": 41, "prev_final_cflag": 41, "ggdb": 41, "duse_jemalloc": 41, "prev_final_ldflag": 41, "rdynam": 41, "1mmake": 41, "1mhiredi": 41, "c99": 41, "o3": 41, "fpic": 41, "wstrict": 41, "prototyp": 41, "wwrite": 41, "net": [41, 47, 48, 50], "sockcompat": 41, "rc": 41, "libhiredi": 41, "1mlinenois": 41, "1mlua": 41, "dlua_ansi": 41, "denable_cjson_glob": 41, "dlua_use_mkstemp": 41, "myldflag": 41, "lapi": 41, "lcode": 41, "ldebug": 41, "ldo": 41, "ldump": 41, "lfunc": 41, "lgc": 41, "llex": 41, "lmem": 41, "lobject": 41, "lopcod": 41, "lparser": 41, "lstate": 41, "lstring": 41, "ltabl": 41, "ltm": 41, "lundump": 41, "lvm": 41, "lzio": 41, "strbuf": 41, "fpconv": 41, "lauxlib": 41, "lbaselib": 41, "ldblib": 41, "liolib": 41, "lmathlib": 41, "loslib": 41, "ltablib": 41, "lstrlib": 41, "loadlib": 41, "linit": 41, "lua_cjson": 41, "lua_struct": 41, "lua_cmsgpack": 41, "lua_bit": 41, "liblua": 41, "dll": 41, "ranlib": 41, "lm": 41, "luac": 41, "1mhdr_histogram": 41, "dhdr_malloc_includ": 41, "hdr_redis_malloc": 41, "libhdrhistogram": 41, "1mjemalloc": 41, "g0": 41, "lg": 41, "quantum": 41, "je_": 41, "gnu99": 41, "g3": 41, "funrol": 41, "xsltproc": 41, "gcc": 41, "iso": 41, "c89": 41, "crai": 41, "gnu11": 41, "wextra": 41, "wshorten": 41, "wsign": 41, "wundef": 41, "preprocessor": 41, "libstdc": 41, "linkag": 41, "grep": 41, "egrep": 41, "ansi": 41, "stat": 41, "stdlib": 41, "inttyp": 41, "stdint": 41, "unistd": 41, "bigendian": 41, "void": 41, "intmax_t": 41, "pc": 41, "paus": 41, "nm": 41, "gawk": 41, "mawk": 41, "usabl": [41, 55], "presenc": 41, "malloc_usable_s": 41, "__attribute__": 41, "syntax": 41, "fvisibl": 41, "hidden": [41, 48], "werror": 41, "herror_on_warn": 41, "tls_model": 41, "alloc_s": 41, "gnu_printf": 41, "printf": 41, "bsd": 41, "ld": 41, "autoconf": 41, "memalign": 41, "valloc": 41, "backtrac": 41, "sbrk": 41, "utrac": 41, "__builtin_unreach": 41, "__builtin_ffsl": 41, "__builtin_popcountl": 41, "lg_page": 41, "pthread": 41, "pthread_creat": 41, "lpthread": 41, "dlfcn": 41, "dlsym": 41, "pthread_atfork": 41, "pthread_setname_np": 41, "clock_gettim": 41, "clock_monotonic_coars": 41, "clock_monoton": 41, "mach_absolute_tim": 41, "syscal": 41, "secure_getenv": 41, "sched_getcpu": 41, "sched_setaffin": 41, "issetugid": 41, "_malloc_thread_cleanup": 41, "_pthread_mutex_init_calloc_cb": 41, "__atom": 41, "__sync": 41, "darwin": 41, "osatom": 41, "madvis": 41, "madv_fre": 41, "madv_dontne": 41, "madv_do": 41, "nt": 41, "madv_": 41, "__builtin_clz": 41, "os_unfair_lock_": 41, "glibc": 41, "mutex": 41, "d_gnu_sourc": 41, "strerror_r": 41, "stdbool": 41, "conform": 41, "_bool": 41, "xsl": 41, "manpag": 41, "xml": 41, "jemalloc_macro": 41, "jemalloc_proto": 41, "jemalloc_typedef": 41, "jemalloc_preambl": 41, "jemalloc_test": 41, "stamp": 41, "jeprof": 41, "jemalloc_def": 41, "jemalloc_internal_def": 41, "jemalloc_test_def": 41, "public_symbol": 41, "private_symbol": 41, "awk": 41, "private_symbols_jet": 41, "public_namespac": 41, "public_unnamespac": 41, "jemalloc_protos_jet": 41, "jemalloc_renam": 41, "jemalloc_mangl": 41, "jemalloc_mangle_jet": 41, "revis": [41, 55], "configure_cflag": 41, "specified_cflag": 41, "extra_cflag": 41, "cppflag": 41, "d_reentrant": 41, "cxx": 41, "configure_cxxflag": 41, "specified_cxxflag": 41, "extra_cxxflag": 41, "extra_ldflag": 41, "dso_ldflag": 41, "wl": 41, "sonam": 41, "lstdc": 41, "rpath_extra": 41, "xslroot": 41, "bindir": 41, "datadir": 41, "includedir": 41, "libdir": 41, "mandir": 41, "man": 41, "srcroot": 41, "abs_srcroot": 41, "objroot": 41, "abs_objroot": 41, "jemalloc_prefix": 41, "jemalloc_private_namespac": 41, "install_suffix": 41, "malloc_conf": 41, "autogen": 41, "experimetal_smallocx": 41, "prof": 41, "libunwind": 41, "libgcc": 41, "xmalloc": 41, "lazy_lock": 41, "oblivi": 41, "libjemalloc": 41, "iinclud": 41, "djemalloc_no_private_namespac": 41, "sym": 41, "arena": 41, "background_thread": 41, "bitmap": 41, "ckh": 41, "ctl": 41, "div": 41, "extent": 41, "extent_dss": 41, "extent_mmap": 41, "malloc_io": 41, "mutex_pool": 41, "nstime": 41, "prng": 41, "rtree": 41, "safety_check": 41, "sc": 41, "sz": 41, "tcach": 41, "test_hook": 41, "ticker": 41, "tsd": 41, "wit": 41, "private_namespac": 41, "gen": 41, "cp": 41, "jemalloc_cpp": 41, "cru": 41, "33madlist": 41, "33mquicklist": 41, "33mae": 41, "33manet": 41, "33mdict": 41, "33mserver": 41, "33msd": 41, "33mzmalloc": 41, "33mlzf_c": 41, "33mlzf_d": 41, "33mpqsort": 41, "33mzipmap": 41, "33msha1": 41, "33mziplist": 41, "33mreleas": 41, "33mnetwork": 41, "33mutil": 41, "33mobject": 41, "33mdb": 41, "33mreplic": 41, "33mrdb": 41, "33mt_string": 41, "33mt_list": 41, "33mt_set": 41, "33mt_zset": 41, "33mt_hash": 41, "33mconfig": 41, "33maof": 41, "33mpubsub": 41, "33mmulti": 41, "33mdebug": 41, "33msort": 41, "33mintset": 41, "33msyncio": 41, "33mcluster": 41, "33mcrc16": 41, "33mendianconv": 41, "33mslowlog": 41, "33meval": 41, "33mbio": 41, "33mrio": 41, "33mrand": 41, "33mmemtest": 41, "33msyscheck": 41, "33mcrcspeed": 41, "33mcrc64": 41, "33mbitop": 41, "33msentinel": 41, "33mnotifi": 41, "33msetproctitl": 41, "33mblock": 41, "33mhyperloglog": 41, "33mlatenc": 41, "33msparklin": 41, "33mredi": 41, "33mgeo": 41, "33mlazyfre": 41, "33mmodul": 41, "33mevict": 41, "33mexpir": 41, "33mgeohash": 41, "33mgeohash_help": 41, "33mchildinfo": 41, "33mdefrag": 41, "33msiphash": 41, "33mrax": 41, "33mt_stream": 41, "33mlistpack": 41, "33mlocaltim": 41, "33mlolwut": 41, "33mlolwut5": 41, "33mlolwut6": 41, "33macl": 41, "33mtrack": 41, "33mconnect": 41, "33mtl": 41, "33msha256": 41, "33mtimeout": 41, "33msetcpuaffin": 41, "33mmonoton": 41, "33mmt19937": 41, "33mresp_pars": 41, "33mcall_repli": 41, "33mscript_lua": 41, "33mscript": 41, "33mfunction": 41, "33mfunction_lua": 41, "33mcommand": 41, "1mlink": 41, "1mredi": 41, "1minstal": 41, "33mredisassert": 41, "33mcli_common": 41, "hint": 41, "idea": 41, "conf": 41, "daemon": 41, "appendonli": 41, "7001": 41, "7002": 41, "shutdown": [41, 42, 55], "pkill": 41, "1m": 41, "0mmaster": 41, "5460": 41, "master": 41, "5461": 41, "10922": 41, "10923": 41, "16383": 41, "fa9bb82124685a6438a696cc1562693ccc815ff0": 41, "c6d7ad6353bf568d17a147e65b8198ded9d65717": 41, "5462": 41, "e26ae6cfbeea8a1e6367444445364d963ae17436": 41, "0mwait": 41, "0mm": 41, "coverag": 41, "num_node_connect": 41, "572": [41, 47], "redisclust": 41, "134": [41, 47, 53], "230052244": 41, "setupt": 41, "24mb": 41, "duse_openssl": 41, "use_ssl": 41, "dhiredis_test_ssl": 41, "libhiredis_ssl": 41, "encyrypt": 41, "test_cert": 41, "openssl": 41, "redis_serv": 41, "keyusag": 41, "digitalsignatur": 41, "keyencipher": 41, "hugectr_cli": 41, "nscerttyp": 41, "genrsa": 41, "public": 41, "rsa": 41, "pubout": 41, "dummi": 41, "req": 41, "x509": 41, "subj": 41, "cn": 41, "dai": [41, 42, 54], "cakei": 41, "caseri": 41, "ser": 41, "cacreateseri": 41, "extfil": 41, "subject": 41, "cert": 41, "cacert": 41, "a441806db5506b7600ee8ae794fa01dc31ac83c9": 41, "6fa93392a396aa3c321736234b7eafc86bb1f979": 41, "8e9cd68cc229fcb568a84d7358011201b4246046": 41, "644": [41, 47], "984": 41, "990": 41, "995": 41, "998": 41, "conclud": 41, "022623188": 41, "hugectr_e2": 42, "base_dir": 42, "data_dir": 42, "train_dir": 42, "val_dir": 42, "model_dir": 42, "decom": 42, "unzip": [42, 45], "filterwarn": 42, "simplefilt": 42, "dask_cudf": [42, 50], "dask_cuda": 42, "localcudaclust": 42, "dask": [42, 50], "device_mem_s": 42, "pynvml_mem_s": 42, "categorifi": [42, 50], "fillmiss": 42, "get_embedding_s": [42, 50, 51], "basicconfig": 42, "asctim": 42, "setlevel": 42, "notset": 42, "getlogg": 42, "asyncio": 42, "schema": [42, 50], "categorical_column": [42, 50], "continuous_column": 42, "label_column": [42, 50], "criteo_column": 42, "cross_column": 42, "c1_c2": 42, "c3_c4": 42, "num_integer_column": 42, "num_categorical_column": 42, "num_total_column": 42, "dashboard": 42, "dashboard_port": 42, "8787": 42, "tcp": 42, "visible_devic": 42, "delect": 42, "device_limit_frac": 42, "spill": 42, "device_pool_frac": 42, "part_mem_frac": 42, "device_s": 42, "device_limit": 42, "device_pool_s": 42, "part_siz": [42, 50], "fmem": 42, "1e9": 42, "bewar": 42, "n_worker": 42, "device_memory_limit": 42, "dashboard_address": 42, "rmm_pool_siz": 42, "061": 42, "preload": 42, "062": 42, "072": 42, "087": 42, "acc90f7f": 42, "fb72": 42, "11ed": 42, "808f": 42, "54ab3adac0a5": 42, "c0d46f34": 42, "503": 42, "789d4132": 42, "7d07": 42, "451f": 42, "ac": 42, "1867dfa9d7b3": 42, "comm": 42, "33423": 42, "40925": 42, "43851": 42, "nanni": 42, "40143": 42, "6pb36hck": 42, "40769": 42, "44353": 42, "43979": 42, "rv8itza6": 42, "45255": 42, "37165": 42, "46241": 42, "co2ru8ea": 42, "40555": 42, "37399": 42, "36117": 42, "04qjh_rt": 42, "39951": 42, "42631": 42, "46323": 42, "9zzs6cz6": 42, "40815": 42, "37909": 42, "40533": 42, "hq437puc": 42, "42963": 42, "41947": 42, "42201": 42, "kuwua5fi": 42, "39607": 42, "45371": 42, "39667": 42, "ouyeimq6": 42, "train_output": 42, "val_output": 42, "train_input": 42, "val_input": 42, "preprocess_dir_temp_train": 42, "preprocess_dir_temp_v": 42, "makedir": 42, "preprocess_dir_temp": 42, "cudf": [42, 50, 55], "one_path": 42, "rmtree": [42, 50], "train_valid_path": 42, "temp_output": 42, "ddf": 42, "read_csv": [42, 45, 46, 49], "sep": 42, "feature_pair": 42, "to_parquet": [42, 45, 49, 50], "train_path": [42, 50], "valid_path": [42, 50], "categorify_op": 42, "cat_featur": [42, 50], "cont_featur": 42, "min_valu": 42, "cross_cat_op": 42, "output_format": 42, "train_ds_iter": 42, "valid_ds_iter": 42, "per_partit": [42, 50], "dict_dtyp": [42, 50], "col": [42, 50], "transform": [42, 44, 47, 48, 50], "to_hugectr": 42, "output_path": [42, 50], "embeddings_dict_cat": 42, "embeddings_dict_cross": 42, "ndask": 42, "1234907": 42, "19683": 42, "13780": 42, "6867": 42, "18490": 42, "6264": 42, "1235": 42, "854680": 42, "114026": 42, "75736": 42, "2159": 42, "7533": 42, "1307783": 42, "404742": 42, "1105613": 42, "87714": 42, "9032": 42, "1577645": 42, "1093030": 42, "187256813049316": 42, "data_path": 42, "model_path": 42, "1581605": 42, "4000": [42, 51], "2720": 42, "1350": 42, "wide_redn": 42, "dropout2": 42, "add1": 42, "21000": 42, "mpiinitservic": 42, "4031005480": 42, "353": [42, 47], "355": 42, "475000": 42, "0018": 42, "7234": 42, "366": 42, "7175": 42, "7946054": 42, "6990506": 42, "0788": 42, "3132": 42, "392": 42, "7372800": 42, "396": [42, 47], "3516": 42, "5847": 42, "397": [42, 47], "2162": 42, "0056": 42, "3464": 42, "874": [42, 50], "429": [42, 53], "70458": 42, "124098": 42, "6176": 42, "130088": 42, "835": 42, "3000": [42, 51], "61959": 42, "101731": 42, "449": 42, "61009": 42, "110557": 42, "738497": 42, "47924": 42, "1046": 42, "10236": 42, "61852": 42, "102157": 42, "771": 42, "58452": 42, "123451": 42, "61023": 42, "122763": 42, "867": [42, 47], "698276": 42, "48087": 42, "487": 42, "0999177": 42, "103": [42, 47], "61106": 42, "0999892": 42, "722": 42, "11000": 42, "61545": 42, "0883301": 42, "348": [42, 53], "12000": [42, 55], "62134": 42, "0828304": 42, "688598": 42, "4733": 42, "13000": 42, "0717": 42, "108287": 42, "14000": 42, "62997": 42, "0745141": 42, "15000": 42, "60764": 42, "0720452": 42, "287": [42, 47], "16000": 42, "61101": 42, "0851126": 42, "758": 42, "685426": 42, "47088": 42, "17000": 42, "0865": 42, "0632745": 42, "18000": 42, "62825": 42, "0742994": 42, "626": 42, "19000": 42, "61035": 42, "0679226": 42, "230": 42, "59954": 42, "0779185": 42, "704": 42, "684045": 42, "4736": 42, "733": 42, "119": 42, "398": [42, 47], "611": 42, "903": [42, 47], "788": [42, 47], "5538": 42, "0770708": 42, "But": [43, 55], "development": 43, "repo": 43, "pybind11": 43, "hugectr_e2e_demo_with_nvtabular": 43, "continuous_train": 43, "multi_gpu_offline_infer": 43, "training_and_inference_with_remote_filesystem": 43, "modal": [43, 45, 46, 55], "movi": [43, 44, 45, 50, 52], "movielen": [43, 44, 50, 51, 52, 55], "25m": [43, 44, 46, 49, 52], "xiaolei": 43, "training_with_remote_filesystem": 43, "price": 44, "purchas": 44, "Such": 44, "rich": [44, 46], "poster": [44, 45, 52], "plot": [44, 46, 48], "synopsi": [44, 45, 52], "music": 44, "audio": 44, "lyric": 44, "itinerari": 44, "plan": [44, 55], "attract": 44, "photo": 44, "resnet": [44, 52], "bert": [44, 55], "pretrain": [44, 50], "enrich": [44, 45, 52], "etl": 44, "000": 45, "subsequ": 45, "sklearn": [45, 55], "model_select": 45, "train_test_split": 45, "download_fil": 45, "input_data_dir": [45, 50, 51], "ml": [45, 46, 49], "grouplen": 45, "movieid": [45, 46, 49, 50, 51], "genr": [45, 50], "toi": 45, "stori": 45, "1995": 45, "adventur": 45, "anim": 45, "children": [45, 47], "comedi": 45, "fantasi": 45, "jumanji": 45, "grumpier": 45, "old": [45, 55], "men": 45, "romanc": 45, "exhal": 45, "drama": 45, "father": 45, "bride": 45, "ii": 45, "movies_convert": [45, 50], "timestamp": [45, 55], "1147880044": 45, "1147868817": 45, "1147868828": 45, "665": 45, "1147878820": 45, "1147868510": 45, "simpl": [45, 49, 55], "test_siz": 45, "random_st": 45, "wish": [45, 46], "proce": [45, 46, 49], "sypnopsi": 46, "scrap": 46, "imdbpi": [46, 48], "ipython": [46, 47, 48], "do_shutdown": [46, 47, 48], "meta": 46, "ia": 46, "director": 46, "the_matrix": 46, "get_movi": 46, "0114709": [46, 47, 49], "get_movie_infoset": 46, "imdbid": [46, 49], "nuniqu": 46, "pickl": [46, 47, 48, 49], "cpu_count": 46, "basemanag": 46, "dictproxi": 46, "movies_id": 46, "movies_info": [46, 48], "movie_info": [46, 48], "risk": 46, "num_job": 46, "chunk_siz": 46, "proc": 46, "pkl": [46, 47, 48, 49], "highest_protocol": [46, 47, 48], "collect_large_post": 46, "filelist": [46, 47], "targetlist": 46, "largefilelist": 46, "largetargetlist": 46, "target_path": 46, "poster_smal": [46, 47], "jpg": [46, 47], "poster_larg": 46, "download_task": 46, "cmd": 46, "popen": 46, "wc": 46, "nvidia_resnet50": 47, "checkout": [47, 55], "5d6d417ff57e8824ef51573e00e5e21307b39697": 47, "classif": [47, 55], "convnet": 47, "pil": 47, "amp": 47, "autocast": 47, "image_classif": 47, "torchvis": [47, 48], "resnet50": 47, "resnext101_32x4d": 47, "se_resnext101_32x4d": 47, "efficientnet_b0": 47, "efficientnet_b4": 47, "efficientnet_widese_b0": 47, "efficientnet_widese_b4": 47, "efficientnet_quant_b0": 47, "efficientnet_quant_b4": 47, "available_model": 47, "load_jpeg_from_fil": 47, "image_s": 47, "img_transform": 47, "compos": 47, "resiz": 47, "centercrop": 47, "totensor": 47, "img": 47, "no_grad": [47, 48], "wherea": 47, "view": [47, 55], "229": [47, 53], "mono": 47, "channel": 47, "sub_": 47, "div_": 47, "check_quant_weight_correct": 47, "checkpoint_path": 47, "map_loc": 47, "startswith": 47, "quantizers_sd_kei": 47, "_amax": 47, "named_modul": 47, "quantiz": [47, 55], "sd_all_kei": 47, "imgnet_class": 47, "loc_synset_map": 47, "model_arg": 47, "pretrained_from_fil": 47, "nvidia_resnet50_200821": 47, "pth": 47, "resnet50_pyt_amp": 47, "hub": 47, "conv1": 47, "conv2d": 47, "kernel_s": 47, "bn1": 47, "batchnorm2d": 47, "momentum": [47, 55], "affin": 47, "track_running_stat": 47, "maxpool": 47, "maxpool2d": 47, "dilat": 47, "ceil_mod": 47, "conv2": 47, "bn2": 47, "conv3": 47, "bn3": 47, "downsampl": 47, "layer2": 47, "layer4": 47, "avgpool": 47, "adaptiveavgpool2d": 47, "output_s": 47, "61951": 47, "0055323": 47, "0274711": 47, "0055320": 47, "0054197": 47, "1791658": 47, "1288589": 47, "0365653": 47, "2324928": 47, "6000478": 47, "num_bathc": 47, "array_split": 47, "strip": 47, "feature_extractor": 47, "feature_dict": [47, 49], "unabl": 47, "0168199": 47, "0118926": 47, "0415856": 47, "0494260": 47, "0810772": 47, "02it": 47, "0049314": 47, "23it": 47, "0066831": 47, "29it": 47, "0888693": 47, "11it": 47, "0067431": 47, "21it": 47, "6522546": 47, "0057811": 47, "5176252": 47, "0112373": 47, "47it": 47, "4636254": 47, "41it": 47, "0365658": 47, "20it": 47, "2124046": 47, "0104469": 47, "14it": 47, "0102493": 47, "17it": 47, "0051792": 47, "65it": 47, "0110017": 47, "0139630": 47, "83it": 47, "0143348": 47, "92it": 47, "0037618": 47, "0040002": 47, "70it": 47, "0317950": 47, "52it": 47, "0850669": 47, "0325258": 47, "6569888": 47, "0037736": 47, "0109303": 47, "44it": 47, "0103882": 47, "59it": 47, "0267287": 47, "24it": 47, "0100033": 47, "43it": 47, "1601215": 47, "46it": [47, 51], "0092028": 47, "0075963": 47, "3267334": 47, "69it": 47, "0059398": 47, "78it": 47, "0122565": 47, "82it": 47, "0052572": 47, "102": [47, 53], "38it": 47, "6404896": 47, "28it": 47, "0027428": 47, "0033883": 47, "0113270": 47, "0022286": 47, "25it": 47, "0068953": 47, "13it": 47, "0042949": 47, "0130297": 47, "15it": 47, "0028207": 47, "0054244": 47, "10it": 47, "1275680": 47, "0036533": 47, "0037297": 47, "51it": 47, "0962736": 47, "0042548": 47, "34it": 47, "0038109": 47, "0104009": 47, "22it": 47, "0180316": 47, "26it": 47, "0071925": 47, "139": 47, "31it": 47, "0087001": 47, "0056910": 47, "0064563": 47, "1720040": 47, "149": 47, "0041112": 47, "16it": 47, "4412528": 47, "0051362": 47, "158": 47, "0029992": 47, "0384309": 47, "0028367": 47, "50it": 47, "0038336": 47, "32it": 47, "0058725": 47, "164": 47, "0113328": 47, "166": 47, "3878542": 47, "33it": 47, "0026465": 47, "0040588": 47, "0086984": 47, "178": 47, "40it": 47, "0309047": 47, "181": 47, "0031405": 47, "185": 47, "0097493": 47, "186": 47, "09it": 47, "0346336": 47, "0078841": 47, "0018795": 47, "9151704": 47, "1417097": 47, "0054223": 47, "0117477": 47, "199": 47, "64it": 47, "0000041": 47, "30it": 47, "0028907": 47, "0366179": 47, "0109761": 47, "217": 47, "39it": 47, "7167686": 47, "219": 47, "0048973": 47, "226": 47, "0100112": 47, "3606394": 47, "0021890": 47, "228": 47, "0033874": 47, "0035019": 47, "232": 47, "1228953": 47, "237": 47, "7688990": 47, "0052954": 47, "0092159": 47, "0094349": 47, "0065136": 47, "246": 47, "0027805": 47, "0034904": 47, "248": [47, 53], "18it": 47, "0037522": 47, "06it": 47, "0036301": 47, "254": [47, 53, 55], "0037324": 47, "35it": 47, "0053622": 47, "265": 47, "42it": 47, "7278178": 47, "266": 47, "37it": 47, "0418239": 47, "0040489": 47, "0069280": 47, "08it": 47, "0049143": 47, "0064840": 47, "285": [47, 50], "0070723": 47, "19it": 47, "0057997": 47, "0056072": 47, "7446332": 47, "0076618": 47, "04it": 47, "0290014": 47, "0347330": 47, "303": 47, "36it": 47, "0159620": 47, "304": 47, "0044667": 47, "07it": 47, "0040190": 47, "3088364": 47, "0230367": 47, "0037147": 47, "310": 47, "0033282": 47, "4028134": 47, "312": 47, "1352824": 47, "314": 47, "0079400": 47, "318": 47, "0449869": 47, "0047526": 47, "320": 47, "0095593": 47, "321": [47, 55], "2762334": 47, "322": 47, "0023293": 47, "0024593": 47, "327": 47, "1116182": 47, "328": [47, 53], "0063462": 47, "0119577": 47, "0106727": 47, "0053884": 47, "337": 47, "0037077": 47, "03it": 47, "0040064": 47, "0089108": 47, "0023129": 47, "347": 47, "0044827": 47, "12it": 47, "0067108": 47, "359": 47, "0432432": 47, "0202415": 47, "0074812": 47, "0059311": 47, "0065073": 47, "0052820": 47, "0120865": 47, "0064620": 47, "0068505": 47, "2934916": 47, "0040137": 47, "0071864": 47, "0072973": 47, "387": 47, "0449951": 47, "388": 47, "27it": 47, "0074605": 47, "0328955": 47, "0077294": 47, "393": [47, 53], "0987918": 47, "394": 47, "0067520": 47, "395": 47, "0220016": 47, "0067236": 47, "0085838": 47, "0047561": 47, "0066075": 47, "0123374": 47, "0026143": 47, "0064626": 47, "0822388": 47, "0101664": 47, "0403579": 47, "0070112": 47, "2323633": 47, "0203408": 47, "1167638": 47, "71it": 47, "0144178": 47, "48it": 47, "0295432": 47, "435": 47, "0123865": 47, "436": 47, "55it": 47, "0110530": 47, "0082817": 47, "45it": 47, "0067525": 47, "0046333": 47, "439": 47, "0248953": 47, "0000033": 47, "0069165": 47, "0000014": 47, "0000027": 47, "05it": 47, "0063531": 47, "0041431": 47, "0831387": 47, "3908598": 47, "0056341": 47, "3833520": 47, "472": 47, "0058660": 47, "0086847": 47, "0074455": 47, "477": 47, "0037990": 47, "481": 47, "1764600": 47, "0372764": 47, "0368576": 47, "0368574": 47, "0366178": 47, "484": 47, "0067118": 47, "488": 47, "0044954": 47, "496": 47, "0078950": 47, "498": 47, "0050957": 47, "0058374": 47, "499": 47, "0027963": 47, "507": 47, "0362590": 47, "508": 47, "0008309": 47, "509": 47, "0065240": 47, "0055022": 47, "0418753": 47, "0070768": 47, "1706680": 47, "518": 47, "3836530": 47, "0050545": 47, "61it": 47, "8752440": 47, "523": 47, "81it": [47, 48], "0019504": 47, "0060117": 47, "526": 47, "1172060": 47, "3280916": 47, "0039502": 47, "3800796": 47, "0074238": 47, "0062032": 47, "0053891": 47, "0184115": 47, "0060968": 47, "0075165": 47, "549": 47, "0076998": 47, "0060176": 47, "0092745": 47, "0079936": 47, "0060747": 47, "2523756": 47, "554": [47, 50], "0092217": 47, "0046906": 47, "0206226": 47, "0086484": 47, "0175471": 47, "0085913": 47, "0233687": 47, "0053214": 47, "0032794": 47, "0040765": 47, "0064541": 47, "0365109": 47, "569": 47, "0337721": 47, "0032234": 47, "0344604": 47, "574": 47, "0041349": 47, "53it": 47, "0180073": 47, "6926486": 47, "583": 47, "0079596": 47, "586": 47, "0140603": 47, "0069745": 47, "0066154": 47, "1745787": 47, "0045995": 47, "0038675": 47, "0068971": 47, "596": 47, "0050205": 47, "598": 47, "0085175": 47, "0424237": 47, "603": [47, 53], "0190524": 47, "3365778": 47, "8119752": 47, "0031742": 47, "610": 47, "0100465": 47, "614": 47, "0072097": 47, "0071771": 47, "0174997": 47, "0033676": 47, "623": [47, 53], "0443567": 47, "0047559": 47, "627": 47, "0260295": 47, "0200768": 47, "640": 47, "0245238": 47, "0075679": 47, "0042418": 47, "645": 47, "0036814": 47, "0079756": 47, "0983922": 47, "0058642": 47, "659": 47, "0116016": 47, "663": 47, "0092238": 47, "666": 47, "2226519": 47, "0414982": 47, "0419641": 47, "0040246": 47, "0217168": 47, "674": 47, "0038452": 47, "675": 47, "3155242": 47, "0038255": 47, "0043153": 47, "0072209": 47, "686": 47, "0074797": 47, "688": 47, "2720826": 47, "690": 47, "0068227": 47, "0372765": 47, "0083713": 47, "0252133": 47, "0329913": 47, "703": 47, "0036840": 47, "56it": 47, "0067956": 47, "2195566": 47, "708": 47, "0080549": 47, "714": [47, 53], "0073398": 47, "716": 47, "0038205": 47, "718": 47, "0117220": 47, "719": 47, "0046198": 47, "0060351": 47, "0081568": 47, "0046921": 47, "0034739": 47, "0023251": 47, "0491764": 47, "0090642": 47, "741": [47, 53], "0037928": 47, "743": 47, "0457430": 47, "0057283": 47, "0462519": 47, "0110546": 47, "0045197": 47, "0062523": 47, "750": 47, "0112454": 47, "0065243": 47, "0396171": 47, "0059710": 47, "0080928": 47, "0126004": 47, "1833116": 47, "770": 47, "0075766": 47, "0123860": 47, "0123970": 47, "0323120": 47, "0035301": 47, "1216520": 47, "0028331": 47, "1330015": 47, "0062443": 47, "0485241": 47, "0154467": 47, "776": 47, "5235348": 47, "0191074": 47, "0060168": 47, "779": 47, "0081738": 47, "0379473": 47, "0063381": 47, "4427076": 47, "0173714": 47, "3794028": 47, "0464106": 47, "0090570": 47, "0087829": 47, "0041866": 47, "0444682": 47, "0058110": 47, "0072392": 47, "0080546": 47, "0064482": 47, "809": 47, "0044599": 47, "0439771": 47, "58it": 47, "0021756": 47, "820": 47, "0039676": 47, "0160801": 47, "0032981": 47, "0049854": 47, "2605312": 47, "0367257": 47, "829": 47, "6817944": 47, "0082081": 47, "1146283": 47, "0796335": 47, "0183355": 47, "0218094": 47, "0290820": 47, "845": 47, "1059793": 47, "0025665": 47, "848": 47, "0259786": 47, "854": 47, "0044369": 47, "0031127": 47, "857": 47, "0283644": 47, "0316599": 47, "0118767": 47, "0059758": 47, "0122194": 47, "0070404": 47, "0028484": 47, "0166792": 47, "0369903": 47, "0073115": 47, "0284655": 47, "9236264": 47, "892": 47, "0137094": 47, "893": 47, "0064323": 47, "895": 47, "49it": 47, "0062741": 47, "68it": 47, "0084237": 47, "901": 47, "0084273": 47, "4193400": 47, "906": 47, "0124307": 47, "908": 47, "0157383": 47, "0412808": 47, "0161860": 47, "918": 47, "4613254": 47, "2788556": 47, "925": 47, "1437361": 47, "3037582": 47, "0048211": 47, "4516162": 47, "0033932": 47, "0042871": 47, "57it": 47, "0137799": 47, "62it": 47, "1714196": 47, "0025117": 47, "2357144": 47, "1525898": 47, "0098088": 47, "6537238": 47, "0303151": 47, "951": 47, "0315632": 47, "0316352": 47, "0166557": 47, "956": 47, "0066879": 47, "3736766": 47, "0140340": 47, "959": [47, 53], "1570970": 47, "0075364": 47, "0099901": 47, "447": 47, "movies_poster_featur": [47, 49], "61504": 47, "huggingfac": 48, "jupyterlab": 48, "nbclassic": 48, "admin": 48, "pip3": 48, "cu111": 48, "torchaudio": 48, "whl": 48, "torch_stabl": 48, "barttoken": 48, "bartmodel": 48, "facebook": 48, "decod": 48, "return_tensor": 48, "pt": 48, "truncat": 48, "max_length": 48, "output_hidden_st": 48, "last_hidden_st": 48, "62423": [48, 49, 51], "average_embed": 48, "movies_synopsis_embed": [48, 49], "proceed": 49, "poster_featur": 49, "61947": 49, "text_featur": 49, "61291": 49, "tmdbid": 49, "0113497": 49, "8844": 49, "0113228": 49, "15602": 49, "0114885": 49, "31357": 49, "0113041": 49, "11862": 49, "0105812": 49, "feature_arrai": 49, "iterrow": [49, 51], "2049": 49, "poster_feature_": 49, "text_feature_": 49, "3073": [49, 51], "feature_df": [49, 51], "datafram": [49, 50], "poster_feature_0": [49, 51], "poster_feature_1": [49, 51], "poster_feature_2": [49, 51], "poster_feature_3": [49, 51], "poster_feature_4": [49, 51], "poster_feature_5": [49, 51], "poster_feature_6": [49, 51], "poster_feature_7": [49, 51], "poster_feature_8": [49, 51], "text_feature_1014": [49, 51], "text_feature_1015": [49, 51], "text_feature_1016": [49, 51], "text_feature_1017": [49, 51], "text_feature_1018": [49, 51], "text_feature_1019": [49, 51], "text_feature_1020": [49, 51], "text_feature_1021": [49, 51], "text_feature_1022": [49, 51], "text_feature_1023": [49, 51], "088281": 49, "036760": 49, "006470": 49, "023553": 49, "000163": 49, "238797": 49, "291230": 49, "197272": 49, "024294": 49, "307049": 49, "789571": 49, "084938": 49, "187339": 49, "061683": 49, "183281": 49, "356245": 49, "289105": 49, "134672": 49, "691380": 49, "045417": 49, "051422": 49, "203168": 49, "617449": 49, "443821": 49, "501953": 49, "736949": 49, "180542": 49, "313696": 49, "274087": 49, "153105": 49, "218745": 49, "187553": 49, "904370": 49, "069441": 49, "026665": 49, "817211": 49, "125072": 49, "173140": 49, "209240": 49, "451933": 49, "491917": 49, "743956": 49, "069061": 49, "900011": 49, "583347": 49, "192817": 49, "224088": 49, "182279": 49, "014646": 49, "004135": 49, "197796": 49, "077938": 49, "215127": 49, "021160": 49, "023108": 49, "394012": 49, "679462": 49, "225475": 49, "196255": 49, "169627": 49, "008575": 49, "172138": 49, "114755": 49, "127861": 49, "003679": 49, "082123": 49, "447287": 49, "002375": 49, "135956": 49, "989514": 49, "808180": 49, "317510": 49, "176658": 49, "078992": 49, "726118": 49, "017430": 49, "249834": 49, "183357": 49, "071451": 49, "644567": 49, "090399": 49, "147284": 49, "pyarrow": 49, "pypi": [49, 55], "satisfi": 49, "33mwarn": 49, "upgrad": [49, 50, 55], "026260": [49, 51], "857608": [49, 51], "410247": [49, 51], "066654": [49, 51], "382803": [49, 51], "899998": [49, 51], "511562": [49, 51], "592291": [49, 51], "565434": [49, 51], "636716": [49, 51], "578369": [49, 51], "996169": [49, 51], "402107": [49, 51], "412318": [49, 51], "859952": [49, 51], "293852": [49, 51], "341114": [49, 51], "727113": [49, 51], "085829": [49, 51], "141265": [49, 51], "721758": [49, 51], "679958": [49, 51], "955634": [49, 51], "391091": [49, 51], "324611": [49, 51], "505211": [49, 51], "258331": [49, 51], "048264": [49, 51], "161505": [49, 51], "431864": [49, 51], "836532": [49, 51], "525013": [49, 51], "654566": [49, 51], "823841": [49, 51], "818313": [49, 51], "856280": [49, 51], "638048": [49, 51], "685537": [49, 51], "119418": [49, 51], "911146": [49, 51], "470762": [49, 51], "762258": [49, 51], "626335": [49, 51], "768947": [49, 51], "241833": [49, 51], "775992": [49, 51], "236340": [49, 51], "865548": [49, 51], "387806": [49, 51], "668321": [49, 51], "552122": [49, 51], "750238": [49, 51], "863707": [49, 51], "382173": [49, 51], "894487": [49, 51], "565142": [49, 51], "164083": [49, 51], "538184": [49, 51], "980678": [49, 51], "643513": [49, 51], "928519": [49, 51], "794906": [49, 51], "201022": [49, 51], "744666": [49, 51], "962188": [49, 51], "915320": [49, 51], "777534": [49, 51], "904200": [49, 51], "167337": [49, 51], "875194": [49, 51], "180481": [49, 51], "815904": [49, 51], "808288": [49, 51], "036711": [49, 51], "902779": [49, 51], "580946": [49, 51], "772951": [49, 51], "239788": [49, 51], "061874": [49, 51], "162997": [49, 51], "388310": [49, 51], "236311": [49, 51], "162757": [49, 51], "207134": [49, 51], "111078": [49, 51], "250022": [49, 51], "335043": [49, 51], "091674": [49, 51], "121507": [49, 51], "418124": [49, 51], "150020": [49, 51], "803506": [49, 51], "059504": [49, 51], "002342": [49, 51], "932321": [49, 51], "manipul": 50, "terabyt": [50, 55], "rapid": 50, "apt": 50, "graphviz": 50, "ubuntu": 50, "focal": 50, "inreleas": 50, "ppa": 50, "launchpad": 50, "deadsnak": 50, "backport": 50, "33m": 50, "newest": [50, 55], "3build2": 50, "libarchive13": 50, "librhash0": 50, "libuv1": 50, "autoremov": 50, "newli": [50, 55], "columngroup": 50, "column_nam": 50, "op1": 50, "op2": 50, "sound": 50, "joinextern": 50, "left": 50, "acycl": 50, "dag": 50, "visual": 50, "contigu": 50, "fulfil": 50, "v0": [50, 54], "movieid_dup": 50, "_duplic": 50, "lambdaop": 50, "int8": 50, "manifest": 50, "matter": 50, "solv": 50, "break": 50, "demand": [50, 55], "hood": 50, "decomposit": 50, "lazili": 50, "couldn": 50, "train_dataset": 50, "100mb": 50, "valid_dataset": 50, "640002432": 50, "troubleshoot": 50, "160000608": 50, "scikit": [50, 55], "981": 50, "0x7fbb086a3370": 50, "\u00b5": 50, "restor": [50, 55], "162542": [50, 51], "56586": [50, 51], "movieid_dupl": [50, 51], "part_0": 50, "26460": 50, "97438": 50, "1704": 50, "105574": 50, "3568": 50, "39464": 50, "127724": 50, "movie_map": 51, "movieid_s": 51, "56581": 51, "209155": 51, "56582": 51, "209157": 51, "56583": 51, "209159": 51, "56584": 51, "209169": 51, "56585": 51, "209171": 51, "set_index": 51, "num_token": 51, "embedding_matrix": 51, "3967": 51, "3072": 51, "17294852": 51, "15285189": 51, "26095702": 51, "75369112": 51, "29602144": 51, "78917433": 51, "13539355": 51, "84843078": 51, "70951219": 51, "10441725": 51, "72871966": 51, "11719463": 51, "18514273": 51, "72422918": 51, "04273015": 51, "1404219": 51, "54169348": 51, "96875489": 51, "08307642": 51, "3673532": 51, "15777258": 51, "01297393": 51, "36267638": 51, "14848055": 51, "82188376": 51, "56516905": 51, "70838085": 51, "45119769": 51, "9273439": 51, "42464321": 51, "henc": [51, 55], "shall": 51, "plu": 51, "pretrained_embedding_s": 51, "convert_pretrained_embeddings_to_sparse_model": 51, "pre_trained_sparse_embed": 51, "hugectr_pretrained_embed": 51, "afterward": [51, 55], "noqa": 51, "pretrained_embed": 51, "10001": 51, "476440390": 51, "275735": 51, "16384000": 51, "256000": 51, "1072": 51, "297110": 51, "581705": 51, "274680": 51, "574425": 51, "746443": 51, "054157": 51, "332273": 51, "564224": 51, "277900": 51, "550730": 51, "764630": 51, "054009": 51, "434429": 51, "536507": 51, "279014": 51, "525059": 51, "773702": 51, "054287": 51, "335757": 51, "532503": 51, "278661": 51, "526352": 51, "779897": 51, "167787": 51, "447136": 51, "547141": 51, "376035": 51, "548916": 51, "784775": 51, "054224": 51, "334735": 51, "540766": 51, "277728": 51, "515882": 51, "786808": 51, "054551": 51, "1300": 51, "336372": 51, "531510": 51, "1400": [51, 53], "277408": 51, "511901": 51, "791416": 51, "165986": 51, "1500": 51, "554217": 51, "522047": 51, "279548": 51, "540521": 51, "793460": 51, "054801": 51, "1700": 51, "336303": 51, "525447": 51, "1800": [51, 53], "278906": 51, "523558": 51, "793137": 51, "054431": 51, "1900": 51, "336023": 51, "511348": 51, "384979": 51, "515268": 51, "796599": 51, "172160": 51, "2100": 51, "453174": 51, "526615": 51, "2200": 51, "278781": 51, "536789": 51, "798459": 51, "054509": 51, "2300": 51, "335596": 51, "508902": 51, "2400": 51, "277901": 51, "520411": 51, "798726": 51, "054518": 51, "2500": 51, "444557": 51, "490832": 51, "2600": 51, "279310": 51, "507799": 51, "801325": 51, "164203": 51, "2700": 51, "443310": 51, "519460": 51, "277569": 51, "512426": 51, "800731": 51, "054590": 51, "2900": 51, "336213": 51, "512216": 51, "384833": 51, "522102": 51, "803801": 51, "054133": 51, "3100": 51, "334245": 51, "507463": 51, "279046": 51, "526148": 51, "802950": 51, "070003": 51, "3300": 51, "352114": 51, "504611": 51, "3400": 51, "277292": 51, "502907": 51, "804364": 51, "054315": 51, "3500": 51, "442956": 51, "512927": 51, "3600": 51, "277974": 51, "519042": 51, "806404": 51, "054291": 51, "3700": 51, "335365": 51, "499368": 51, "3800": 51, "277786": 51, "509683": 51, "805164": 51, "064908": 51, "3900": 51, "344106": 51, "508182": 51, "387872": 51, "493841": 51, "808367": 51, "054222": 51, "4100": 51, "335361": 51, "508106": 51, "278802": 51, "519000": 51, "808897": 51, "054320": 51, "4300": 51, "334094": 51, "502797": 51, "4400": 51, "388990": 51, "508890": 51, "809649": 51, "074584": 51, "355005": 51, "505778": 51, "4600": 51, "277275": 51, "532776": 51, "810962": 51, "054498": 51, "4700": 51, "335553": 51, "503001": 51, "4800": 51, "279237": 51, "495762": 51, "808618": 51, "4900": 51, "449926": 51, "503213": 51, "277141": 51, "481138": 51, "810767": 51, "064807": 51, "untrain": 51, "5100": 51, "630313": 51, "485568": 51, "5200": 51, "278359": 51, "518924": 51, "811217": 51, "054624": 51, "5300": 51, "336246": 51, "516505": 51, "5400": 51, "384571": 51, "512404": 51, "811464": 51, "054350": 51, "5500": 51, "334675": 51, "500305": 51, "5600": 51, "279563": 51, "484969": 51, "bart": 52, "din": [53, 55], "0bcb014209e219273cb6fd4152df7df713cbac61": 53, "25t09": 53, "53z": 53, "protoc": 53, "4b40fff8bb27201ba07b6fa5651217fb": 53, "jar": 53, "172": 53, "dlrm_parquet": 53, "supergroup": 53, "112247365": 53, "112243637": 53, "112251207": 53, "112241764": 53, "112247838": 53, "112244076": 53, "112253553": 53, "112249557": 53, "112239093": 53, "112249156": 53, "lastli": [53, 55], "label0": 53, "c5": 53, "c6": 53, "c7": 53, "c8": 53, "c9": 53, "c10": 53, "c12": 53, "c13": 53, "c14": 53, "c15": 53, "c16": 53, "c17": 53, "c18": 53, "c19": 53, "c20": 53, "c21": 53, "c22": 53, "c23": 53, "c24": 53, "c25": 53, "c26": 53, "c27": 53, "c28": 53, "c29": 53, "c30": 53, "c31": 53, "c32": 53, "c33": 53, "c34": 53, "c35": 53, "c36": 53, "c37": 53, "c38": 53, "c39": 53, "train_with_hdf": 53, "datasourcetype_t": 53, "405274": 53, "72550": 53, "55008": 53, "222734": 53, "316071": 53, "156265": 53, "220243": 53, "200179": 53, "234566": 53, "335625": 53, "278726": 53, "263070": 53, "312542": 53, "203773": 53, "145859": 53, "117421": 53, "78140": 53, "3648": 53, "156308": 53, "94562": 53, "357703": 53, "386976": 53, "238046": 53, "230917": 53, "156382": 53, "10720": 53, "502": 53, "3218787045": 53, "607": 53, "529": 53, "530": 53, "a10": 53, "21954560": 53, "010000": 53, "716815": 53, "69327": 53, "856": 53, "719486": 53, "693207": 53, "750294": 53, "693568": 53, "721128": 53, "693352": 53, "78435": 53, "499891": 53, "5486": 53, "2728": 53, "693178": 53, "720984": 53, "693292": 53, "756448": 53, "693053": 53, "725832": 53, "693433": 53, "382": 53, "77763": 53, "693193": 53, "500092": 53, "57548": 53, "575": 53, "0_sparse_2000": 53, "_dense_2000": 53, "_opt_dense_2000": 53, "430": 53, "drwxr": 53, "xr": 53, "9479684": 53, "functionalit": 53, "dcn_parquet": 53, "train_with_s3": 53, "east": [53, 55], "39884": 53, "39043": 53, "17289": 53, "7420": 53, "20263": 53, "7120": 53, "1543": 53, "slice12": 53, "amazonaw": [53, 55], "pipeline_test": 53, "dcn_model": 53, "569406237": 53, "822": 53, "710": 53, "713": 53, "397821": 53, "2457600": 53, "1453": 53, "25574": 53, "712926": 53, "16987": 53, "701584": 53, "22653": 53, "696012": 53, "16121": 53, "698167": 53, "42367": 53, "695641": 53, "500979": 53, "0735": 53, "6575": 53, "696028": 53, "03696": 53, "693602": 53, "089": 53, "73903": 53, "693618": 53, "10101": 53, "696232": 53, "59704": 53, "50103": 53, "5882": 53, "473": 53, "0_sparse_1000": 53, "_dense_1000": 53, "_opt_dense_1000": 53, "843": 53, "988": 53, "denable_gc": 53, "enable_gc": 53, "gcp": 53, "credenti": 53, "environment": 53, "google_application_credenti": 53, "gcs_kei": 53, "train_with_gc": 53, "1008636636": 53, "308": 53, "323": 53, "236": 53, "22452": 53, "786299": 53, "6347": 53, "738846": 53, "22938": 53, "711017": 53, "63355": 53, "708317": 53, "850": 53, "11226": 53, "697101": 53, "501301": 53, "0298": 53, "6054": 53, "698077": 53, "744573": 53, "697804": 53, "244": 53, "04207": 53, "695543": 53, "761465": 53, "695323": 53, "28151": 53, "695319": 53, "647": 53, "501347": 53, "3576": 53, "664": 53, "804": 53, "submiss": 54, "ve": [54, 55], "billion": 54, "curv": 54, "dual": 54, "dgx1": 54, "emb_dim": 54, "6x": 54, "criteolab": 54, "criteo_script": [54, 55], "criteo2hugectr": 54, "tfrecord": 54, "chart": 54, "seven": 54, "exhibit": 54, "incremental_dump": 55, "illeg": 55, "hierarh": 55, "inconsist": 55, "anymor": 55, "export_predict": 55, "legaci": 55, "corner": 55, "nan": 55, "occasion": 55, "thousand": 55, "happen": 55, "cub": 55, "workaround": 55, "rmm": 55, "mr": 55, "set_current_device_resourc": 55, "356": 55, "hctr_rmm_settabl": 55, "cautiou": 55, "1g": 55, "243": 55, "kafkaproduc": 55, "succe": 55, "unrespons": 55, "reachabl": 55, "joint": 55, "suit": 55, "omit": 55, "futr": 55, "hierarchicalkv": 55, "cmakelist": 55, "minor": 55, "duse_cudart_stat": 55, "torchscript": 55, "coupl": 55, "regress": 55, "unnessari": 55, "h800": 55, "fp8": 55, "dequant": 55, "x86": 55, "superchip": 55, "hand": 55, "_concat_": 55, "dense_embed": 55, "refin": 55, "devicesegmentedsort": 55, "devicesegmentedradixsort": 55, "led": 55, "datadistributor": 55, "fly": 55, "member": 55, "elimin": 55, "parquet_reader_opt": 55, "set_num_row": 55, "pr": 55, "core23": 55, "hctr_print": 55, "did": 55, "cmak": 55, "ing": 55, "clarifi": 55, "refactor": 55, "dynamic_vari": 55, "adamax": 55, "adadelta": 55, "fault": 55, "wrong": 55, "fusion": 55, "cudadevicesynchron": 55, "embeddingtablecollect": 55, "utest": 55, "unfus": 55, "analayz": 55, "stress": 55, "crosslay": 55, "backpropag": 55, "move": 55, "denselayerswitch": 55, "unfamiliar": 55, "nic": 55, "python_interfac": 55, "strengthen": 55, "datasest": 55, "is_exclusive_kei": 55, "nob": 55, "sparseparam": 55, "misus": 55, "clearer": 55, "violat": 55, "newer": 55, "wdl_predict": 55, "januari": 55, "calendar": 55, "v23": 55, "bst": 55, "conceptu": 55, "arxiv": 55, "ab": 55, "2008": 55, "13535": 55, "redisclusterbackend": 55, "prop": 55, "test_embedding_table_optim": 55, "embedding_collect": 55, "clariti": 55, "bind": 55, "recov": 55, "sometim": 55, "problem": 55, "failur": 55, "macro": 55, "reiniti": 55, "end_offset": 55, "deeprec": 55, "embeddingplann": 55, "embedding_collection_test": 55, "db_type": 55, "boundari": 55, "hierarchc": 55, "co": 55, "round": 55, "trip": 55, "mlplayer": 55, "dgx_a100_mlp": 55, "preprocess_censu": 55, "mmoe": 55, "replicacontext": 55, "4_nvt_process": 55, "dgx_a100_ib_nvlink": 55, "dlpack": 55, "odd": 55, "sector": 55, "unreport": 55, "leak": 55, "table_group_strategi": 55, "table_placement_strategi": 55, "mmoe_parquet": 55, "simplif": 55, "mybucket": 55, "graphic": 55, "epilogu": 55, "corrupt": 55, "improp": 55, "io_block_s": 55, "max_nr_request": 55, "stabliz": 55, "globalembeddingdata": 55, "localembeddingdata": 55, "mention": 55, "bullet": 55, "ratio": 55, "subset": 55, "durat": 55, "hadoopfilesystem": 55, "hadoop_filesystem": 55, "hpp": 55, "third_parti": 55, "finer": 55, "deperac": 55, "overlapped_pipelin": 55, "triton_tf_deploi": 55, "cucollect": 55, "embedding_storag": 55, "dynamic_embedding_storag": 55, "interoper": 55, "slurm": 55, "305": 55, "482141": 55, "440781": 55, "46146124601364136": 55, "databasebackend": 55, "budget": 55, "nanosecond": 55, "strict": 55, "caller": 55, "unprocess": 55, "callback": 55, "load_dump": 55, "sst": 55, "find_tabl": 55, "discov": 55, "routin": 55, "inlin": 55, "340": 55, "concept": 55, "matrixmultipli": 55, "goal": 55, "navig": 55, "multiplex": 55, "gbp": 55, "upsert": 55, "diminish": 55, "recal": 55, "4x": 55, "rather": 55, "safer": 55, "ndcg": 55, "smape": 55, "extractor": 55, "261": 55, "inspir": 55, "roc_auc_scor": 55, "unweight": 55, "release_not": 55, "reorgan": 55, "dlrm_kaggle_fp32": 55, "36672493": 55, "301": 55, "standalon": 55, "prodvid": 55, "decoupl": 55, "realli": 55, "embedding_workspace_calcul": 55, "qa": 55, "codebas": 55, "relev": 55, "model_analyz": 55, "won": 55, "bare": 55, "notic": 55, "lessen": 55, "dlrm_benchmark": 55, "uint32_t": 55, "int64_t": 55, "uint32": 55, "all2alldenseembed": 55, "embedding_initi": 55, "randomuniform": 55, "readabl": 55, "robust": 55, "resolut": 55, "recycl": 55, "unload": 55, "invok": 55, "conda": 55, "event": 55, "notebok": 55, "inaccur": 55, "parameter": 55, "meaning": 55, "jabber": 55, "uniformli": 55, "interleav": 55, "shouldn": 55, "graphschedul": 55, "grapschedul": 55, "cudagraph": 55, "gap": 55, "adjac": 55, "grain": 55, "frozen": 55, "unfrozen": 55, "worri": 55, "gpu_cach": 55, "oversubscript": 55, "hmem": 55, "mo": 55, "use_host_memory_p": 55, "ps_type": 55, "vice": 55, "versa": 55, "famili": 55, "poc": 55, "assist": 55, "explain": 55, "involv": 55, "netwoek": 55, "fusedrelubiasfullyconnectedlay": 55, "holist": 55, "use_overlapped_pipelin": 55, "use_hash_t": 55, "multiworkermirroredstrategi": 55, "concret": 55, "ncf": 55, "gmf": 55, "neumf": 55, "dien": 55, "paraquet": 55, "moment": 55, "stand": 55, "alon": 55, "dotproduct": 55, "__half2": 55, "vocabulary_s": 55, "streamlin": 55, "grasp": 55, "embedding_plugin": 55, "localizedslotsparseembeddinghashonehot": 55, "claus": 55, "max_eval_sampl": 55, "multiplylay": 55, "weightmultiplylay": 55, "perl": 55, "embeddinglay": 55, "helper": 55, "coars": 55, "tensorfloat": 55, "mantissa": 55, "expon": 55, "redesign": 55, "multinod": 55, "hugectr_user_guid": 55, "preprocess_nvt": 55, "hasn": 55, "dl": 56, "vast": 56, "broad": 56, "balanc": 56, "littl": 56}, "objects": {"hierarchical_parameter_server": [[8, 0, 1, "", "Init"], [9, 1, 1, "", "LookupLayer"], [9, 1, 1, "", "SparseLookupLayer"]], "hierarchical_parameter_server.LookupLayer": [[9, 2, 1, "", "call"]], "hierarchical_parameter_server.SparseLookupLayer": [[9, 2, 1, "", "call"]]}, "objtypes": {"0": "py:function", "1": "py:class", "2": "py:method"}, "objnames": {"0": ["py", "function", "Python function"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"]}, "titleterms": {"question": 0, "answer": 0, "1": [0, 30, 41, 43, 54, 55], "who": 0, "ar": 0, "target": 0, "user": 0, "hugectr": [0, 2, 3, 4, 25, 29, 31, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 51, 53, 54], "2": [0, 30, 41, 43, 54, 55], "which": 0, "model": [0, 4, 5, 6, 20, 21, 22, 26, 27, 30, 31, 32, 33, 36, 40, 42, 48, 51, 53], "can": 0, "support": [0, 36], "3": [0, 30, 41, 43, 55], "doe": 0, "tensorflow": [0, 10, 24, 30, 33, 54], "4": [0, 30, 41, 43, 55], "multipl": [0, 21, 33], "node": [0, 36], "ctr": 0, "train": [0, 4, 5, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 36, 40, 41, 42, 44, 45, 51, 53], "5": [0, 30, 41, 55], "how": [0, 35], "deal": 0, "huge": 0, "embed": [0, 2, 5, 19, 22, 26, 27, 30, 40, 41, 48, 51], "tabl": [0, 19, 21, 23, 28, 30, 40], "cannot": 0, "store": [0, 49], "singl": 0, "gpu": [0, 33, 47], "memori": 0, "6": [0, 55], "7": [0, 55], "must": 0, "we": 0, "us": [0, 2, 10, 13, 17, 19, 24, 30, 31, 32, 33, 38, 40, 42], "dgx": [0, 54], "famili": 0, "a100": [0, 54], "run": [0, 30, 40, 43, 50], "8": [0, 55], "without": [0, 41], "infiniband": 0, "9": [0, 55], "i": 0, "ani": 0, "requir": 0, "cpu": 0, "configur": [0, 5, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33], "execut": [0, 5], "10": 0, "what": [0, 55], "specif": [0, 25, 29, 34, 43], "format": [0, 4, 30], "file": [0, 4, 30, 31, 32, 33, 53], "input": [0, 2, 21, 30], "11": [0, 55], "python": [0, 4], "interfac": [0, 4], "12": [0, 55], "do": [0, 30, 31, 32, 33], "synchron": 0, "otherwis": 0, "asynchron": 0, "13": 0, "stream": 0, "14": 0, "slot": 0, "15": 0, "differ": 0, "between": 0, "localizedslotembed": 0, "distributedslotembed": 0, "16": 0, "For": 0, "multi": [0, 36, 41, 44, 49, 52], "dataread": [0, 4], "read": 0, "same": 0, "batch": 0, "data": [0, 4, 28, 30, 31, 38, 40, 41, 42, 44, 46, 49, 53], "each": 0, "step": [0, 30, 45], "17": 0, "As": 0, "parallel": [0, 36], "layer": [0, 2, 4, 9, 20, 21, 22, 24, 26, 27, 33, 51], "get": [0, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 45], "all": [0, 46, 47, 48], "lookup": [0, 5, 28, 41], "featur": [0, 36, 47, 48, 49, 51], "from": [0, 20, 21, 22, 23, 24, 26, 27, 28, 30, 34, 35, 38, 41, 46, 47], "18": 0, "set": [0, 35], "claus": 0, "two": 0, "need": 0, "19": 0, "save": [0, 20, 21, 26], "load": [0, 22, 51], "20": 0, "could": 0, "post": 0, "import": 0, "other": 0, "framework": 0, "infer": [0, 4, 5, 20, 21, 23, 24, 26, 30, 35, 41], "deploy": [0, 41], "21": 0, "overlap": 0, "22": 0, "": [0, 48, 54, 55], "valu": 0, "23": [0, 55], "benchmark": [0, 6, 10, 17, 30, 38], "my": 0, "network": 0, "24": [0, 55], "workspace_size_per_gpu_in_mb": 0, "slot_size_arrai": 0, "25": 0, "nvlink": 0, "26": 0, "onli": 0, "server": [0, 5, 7, 10, 13, 17, 18, 20, 25, 29, 30, 36, 41], "27": 0, "28": 0, "pretrain": [0, 22, 47, 48, 51], "29": 0, "construct": 0, "graph": [0, 20, 21, 24, 26, 30, 31, 32, 33], "branch": 0, "topologi": 0, "30": 0, "good": 0, "practic": 0, "vector": [0, 41], "size": 0, "31": 0, "resolv": 0, "bu": 0, "error": 0, "when": 0, "sampl": 0, "notebook": [0, 10, 13, 17, 25, 29, 34, 40, 43, 52], "32": 0, "log": 0, "pool": 0, "empti": 0, "impli": 0, "addit": 1, "resourc": [1, 6, 39], "class": [2, 4, 12], "method": [2, 4], "spars": [2, 21, 32, 33, 35, 36, 56], "type": 2, "detail": 2, "distributedslotsparseembeddinghash": 2, "localizedslotsparseembeddinghash": 2, "localizedslotsparseembeddingonehot": 2, "dens": 2, "usag": 2, "fullyconnect": 2, "mlp": 2, "multicross": 2, "fmorder2": 2, "weightmultipli": 2, "elementwisemultipli": 2, "batchnorm": 2, "layernorm": 2, "concat": 2, "reshap": 2, "select": 2, "slice": 2, "dropout": 2, "elu": 2, "relu": 2, "sigmoid": 2, "interact": 2, "add": [2, 4], "reducesum": 2, "gru": 2, "preludic": 2, "scale": 2, "fusedreshapeconcat": 2, "fusedreshapeconcatgener": 2, "softmax": 2, "sub": 2, "reducemean": 2, "matrixmutipli": 2, "multiheadattent": 2, "sequencemask": 2, "gather": 2, "binarycrossentropyloss": 2, "crossentropyloss": 2, "multicrossentropyloss": 2, "collect": [2, 40, 46], "about": [2, 4, 38, 40], "overview": [2, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 44, 53], "known": [2, 55], "limit": 2, "embeddingtableconfig": 2, "embeddingcollectionconfig": 2, "embedding_lookup": 2, "shard": 2, "api": [3, 4, 7, 11, 16, 40], "document": 3, "high": 4, "level": 4, "solver": 4, "createsolv": 4, "asyncparam": 4, "hybridembeddingparam": 4, "datareaderparam": 4, "dataset": [4, 38, 45], "list": [4, 25, 29, 34, 43], "raw": 4, "parquet": 4, "optparamspi": 4, "createoptim": 4, "compil": 4, "fit": 4, "summari": [4, 36], "graph_to_json": 4, "construct_from_json": 4, "load_dense_weight": 4, "load_dense_optimizer_st": 4, "load_sparse_weight": 4, "load_sparse_optimizer_st": 4, "freeze_dens": 4, "freeze_embed": 4, "unfreeze_dens": 4, "unfreeze_embed": 4, "reset_learning_rate_schedul": 4, "set_sourc": 4, "low": 4, "learningrateschedul": 4, "get_next": 4, "is_eof": 4, "get_learning_rate_schedul": 4, "get_data_reader_train": 4, "get_data_reader_ev": 4, "start_data_read": 4, "set_learning_r": 4, "get_current_loss": 4, "eval": 4, "get_eval_metr": 4, "save_params_to_fil": 4, "check_out_tensor": 4, "inferenceparam": 4, "inferencemodel": 4, "predict": 4, "evalu": [4, 54], "gener": [4, 28, 31, 38, 41], "datageneratorparam": 4, "datagener": 4, "sourc": [4, 5, 35], "datasourceparam": 4, "hierarch": [5, 7, 10, 13, 17, 18, 20, 25, 29, 36, 41], "paramet": [5, 7, 10, 13, 17, 18, 20, 25, 29, 36, 41], "databas": 5, "backend": [5, 24], "introduct": [5, 10, 13, 17, 38], "hp": [5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 34, 41], "background": 5, "architectur": 5, "iter": 5, "updat": 5, "optim": [5, 36], "cach": 5, "param": 5, "syntax": 5, "volatil": 5, "overflow": 5, "common": 5, "persist": 5, "dlrm": [6, 26, 27, 40, 53], "setup": [6, 40, 41, 42, 53], "result": [6, 19], "initi": 8, "sparselookuplay": [9, 21, 26], "lookuplay": [9, 12, 20, 21, 24], "plugin": [10, 11, 12, 13, 14, 15, 16, 17, 30, 31, 32, 33, 34], "benefit": 10, "workflow": [10, 17], "instal": [10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38], "comput": [10, 13, 17, 38], "capabl": [10, 13, 17, 38], "ngc": [10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 43], "contain": [10, 13, 17, 30, 34, 35, 38], "exampl": [10, 13, 17, 42, 43, 52, 53], "torch": [11, 12, 13, 28], "creator": 15, "tensorrt": [16, 17, 30, 31, 32, 33, 34], "profil": 19, "build": [19, 27, 30, 31, 32, 33, 35, 38, 43], "creat": [19, 20, 21, 23, 24, 26, 30, 49], "synthet": [19, 38, 49], "measur": 19, "triton": [19, 24, 30, 31, 32, 33], "perf": 19, "analyz": 19, "v": 19, "demo": [20, 22, 23, 26, 27, 28, 31, 32, 33, 41], "nativ": [20, 21, 22, 24, 33], "tf": [20, 21, 22, 23, 24, 30, 33], "pre": [22, 50, 51], "via": 22, "fusion": [23, 28], "savedmodel": [23, 24], "make": 23, "deploi": [24, 31, 32, 33], "trt": 24, "quickstart": [25, 29, 34], "pull": [25, 29, 34, 43], "docker": [25, 29, 30, 43], "clone": [25, 29, 34, 43], "repositori": [25, 29, 30, 34, 43], "start": [25, 29, 34, 35, 43, 45], "jupyt": [25, 29, 34, 43], "system": [25, 29, 30, 34, 43, 44, 53], "sok": [26, 27, 35], "larg": 30, "integr": [30, 31, 32, 33], "engin": [30, 31, 32, 33], "step1": [30, 31, 32, 33], "prepar": [30, 31, 32, 33, 40, 42, 53], "147gb": 30, "scratch": [30, 38, 41], "step2": [30, 31, 32, 33], "json": [30, 31, 32, 33], "step3": [30, 31, 32, 33], "convert": [30, 31, 32, 33, 36, 41, 45], "onnx": [30, 31, 32, 33, 36, 41], "surgeri": [30, 31, 32, 33], "step4": 30, "launch": 30, "arm64": 30, "grace": 30, "hooper": 30, "nvidia": [30, 47], "merlin": [30, 35, 39], "imag": 30, "host": 30, "pytorch": 32, "contribut": 35, "new": [35, 55], "code": 35, "your": 35, "develop": 35, "up": 35, "environ": 35, "With": 35, "oper": [35, 36, 56], "kit": [35, 36, 56], "core": 36, "mix": 36, "precis": 36, "sgd": 36, "learn": 36, "rate": 36, "schedul": 36, "hdf": [36, 53], "talk": 37, "blog": 37, "tool": 38, "download": [38, 45, 47, 48], "preprocess": [38, 42, 50], "relat": 39, "thi": 40, "concept": 40, "refer": 40, "an": 40, "follow": 40, "command": 40, "termin": 40, "script": 40, "placement": 40, "strategi": 40, "round": 40, "robin": 40, "uniform": 40, "hybrid": 40, "dynam": 40, "hash": 40, "dlpack": 41, "process": [41, 50], "redi": 41, "cluster": 41, "tl": 41, "ssl": 41, "end": 42, "nvtabular": [42, 50], "wdl": 42, "custom": 43, "option": 43, "recommend": 44, "modal": [44, 49, 52], "movielen": [45, 46], "25m": 45, "split": 45, "valid": 45, "next": 45, "enrich": 46, "scrape": 46, "imdb": 46, "synopsi": [46, 48], "movi": [46, 47, 48, 49, 51], "poster": [46, 47], "extract": [47, 48], "resnet": 47, "50": 47, "cloud": [47, 53], "bart": 48, "text": 48, "summar": 48, "real": 49, "etl": 50, "defin": [50, 51], "our": 50, "pipelin": 50, "check": 50, "output": 50, "non": 51, "trainabl": 51, "remot": 53, "dcn": 53, "aw": 53, "s3": 53, "googl": 53, "storag": 53, "perform": 54, "mlperf": 54, "releas": 55, "note": 55, "version": 55, "06": 55, "08": 55, "04": 55, "02": 55, "0": 55, "issu": 55}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx.ext.intersphinx": 1, "sphinx": 57}, "alltitles": {"Questions and Answers": [[0, "questions-and-answers"]], "1. Who are the target users of HugeCTR?": [[0, "who-are-the-target-users-of-hugectr"]], "2. Which models can be supported in HugeCTR?": [[0, "which-models-can-be-supported-in-hugectr"]], "3. Does HugeCTR support TensorFlow?": [[0, "does-hugectr-support-tensorflow"]], "4. Does HugeCTR support multiple nodes CTR training?": [[0, "does-hugectr-support-multiple-nodes-ctr-training"]], "5. How to deal with the huge embedding table that cannot be stored in a single GPU memory?": [[0, "how-to-deal-with-the-huge-embedding-table-that-cannot-be-stored-in-a-single-gpu-memory"]], "6. Which GPUs are supported in HugeCTR?": [[0, "which-gpus-are-supported-in-hugectr"]], "7. Must we use the DGX family such as DGX A100 to run HugeCTR?": [[0, "must-we-use-the-dgx-family-such-as-dgx-a100-to-run-hugectr"]], "8. Can HugeCTR run without InfiniBand?": [[0, "can-hugectr-run-without-infiniband"]], "9. Is there any requirement of CPU configuration for HugeCTR execution?": [[0, "is-there-any-requirement-of-cpu-configuration-for-hugectr-execution"]], "10. What is the specific format of files as input in HugeCTR?": [[0, "what-is-the-specific-format-of-files-as-input-in-hugectr"]], "11.\t Does HugeCTR support Python interface?": [[0, "does-hugectr-support-python-interface"]], "12. Does HugeCTR do synchronous training with multiple GPUs (and nodes)? Otherwise, does it do asynchronous training?": [[0, "does-hugectr-do-synchronous-training-with-multiple-gpus-and-nodes-otherwise-does-it-do-asynchronous-training"]], "13. Does HugeCTR support stream training?": [[0, "does-hugectr-support-stream-training"]], "14. What is a \u201cslot\u201d in HugeCTR?": [[0, "what-is-a-slot-in-hugectr"]], "15. What are the differences between LocalizedSlotEmbedding and DistributedSlotEmbedding?": [[0, "what-are-the-differences-between-localizedslotembedding-and-distributedslotembedding"]], "16. For multi-node\uff0cis DataReader required to read the same batch of data on each node for each step?": [[0, "for-multi-node-is-datareader-required-to-read-the-same-batch-of-data-on-each-node-for-each-step"]], "17. As model parallelism in embedding layers, how does it get all the embedding lookup features from multi-node / multi-gpu?": [[0, "as-model-parallelism-in-embedding-layers-how-does-it-get-all-the-embedding-lookup-features-from-multi-node-multi-gpu"]], "18. How to set data clauses, if there are two embeddings needed?": [[0, "how-to-set-data-clauses-if-there-are-two-embeddings-needed"]], "19. How to save and load models in HugeCTR?": [[0, "how-to-save-and-load-models-in-hugectr"]], "20. Could the post training model from HugeCTR be imported into other frameworks such as TensorFlow for inference deployment?": [[0, "could-the-post-training-model-from-hugectr-be-imported-into-other-frameworks-such-as-tensorflow-for-inference-deployment"]], "21. Does HugeCTR support overlap between different slots?": [[0, "does-hugectr-support-overlap-between-different-slots"]], "22. What if there\u2019s no value in a slot?": [[0, "what-if-there-s-no-value-in-a-slot"]], "23. How can I benchmark my network?": [[0, "how-can-i-benchmark-my-network"]], "24. How to set workspace_size_per_gpu_in_mb and slot_size_array?": [[0, "how-to-set-workspace-size-per-gpu-in-mb-and-slot-size-array"]], "25. Is nvlink required in HugeCTR?": [[0, "is-nvlink-required-in-hugectr"]], "26. Is DGX the only GPU server that is required in HugeCTR?": [[0, "is-dgx-the-only-gpu-server-that-is-required-in-hugectr"]], "27. Can HugeCTR run without InfiniBand?": [[0, "id1"]], "28. Does HugeCTR support loading pretrained embeddings in other formats?": [[0, "does-hugectr-support-loading-pretrained-embeddings-in-other-formats"]], "29. How to construct the model graph with branch topology in HugeCTR?": [[0, "how-to-construct-the-model-graph-with-branch-topology-in-hugectr"]], "30. What is the good practice of configuring the embedding vector size?": [[0, "what-is-the-good-practice-of-configuring-the-embedding-vector-size"]], "31. How to resolve the bus error when running HugeCTR samples and notebooks?": [[0, "how-to-resolve-the-bus-error-when-running-hugectr-samples-and-notebooks"]], "32. What does the log \u201cmemory pool is empty\u201d imply for HugeCTR inference?": [[0, "what-does-the-log-memory-pool-is-empty-imply-for-hugectr-inference"]], "Additional Resources": [[1, "additional-resources"]], "HugeCTR Layer Classes and Methods": [[2, "hugectr-layer-classes-and-methods"]], "Input Layer": [[2, "input-layer"]], "Sparse Embedding": [[2, "sparse-embedding"]], "Embedding Types Detail": [[2, "embedding-types-detail"]], "DistributedSlotSparseEmbeddingHash Layer": [[2, "distributedslotsparseembeddinghash-layer"]], "LocalizedSlotSparseEmbeddingHash Layer": [[2, "localizedslotsparseembeddinghash-layer"]], "LocalizedSlotSparseEmbeddingOneHot Layer": [[2, "localizedslotsparseembeddingonehot-layer"]], "Dense Layers": [[2, "dense-layers"]], "Dense Layers Usage": [[2, "dense-layers-usage"]], "FullyConnected Layer": [[2, "fullyconnected-layer"]], "MLP Layer": [[2, "mlp-layer"]], "MultiCross Layer": [[2, "multicross-layer"]], "FmOrder2 Layer": [[2, "fmorder2-layer"]], "WeightMultiply Layer": [[2, "weightmultiply-layer"]], "ElementwiseMultiply Layer": [[2, "elementwisemultiply-layer"]], "BatchNorm Layer": [[2, "batchnorm-layer"]], "LayerNorm Layer": [[2, "layernorm-layer"]], "Concat Layer": [[2, "concat-layer"]], "Reshape Layer": [[2, "reshape-layer"]], "Select Layer": [[2, "select-layer"]], "Slice Layer": [[2, "slice-layer"]], "Dropout Layer": [[2, "dropout-layer"]], "ELU Layer": [[2, "elu-layer"]], "ReLU Layer": [[2, "relu-layer"]], "Sigmoid Layer": [[2, "sigmoid-layer"]], "Interaction Layer": [[2, "interaction-layer"]], "Add Layer": [[2, "add-layer"]], "ReduceSum Layer": [[2, "reducesum-layer"]], "GRU Layer": [[2, "gru-layer"]], "PReLUDice Layer": [[2, "preludice-layer"]], "Scale Layer": [[2, "scale-layer"]], "FusedReshapeConcat Layer": [[2, "fusedreshapeconcat-layer"]], "FusedReshapeConcatGeneral Layer": [[2, "fusedreshapeconcatgeneral-layer"]], "Softmax Layer": [[2, "softmax-layer"]], "Sub Layer": [[2, "sub-layer"]], "ReduceMean Layer": [[2, "reducemean-layer"]], "MatrixMutiply Layer": [[2, "matrixmutiply-layer"]], "MultiHeadAttention Layer": [[2, "multiheadattention-layer"]], "SequenceMask Layer": [[2, "sequencemask-layer"]], "Gather Layer": [[2, "gather-layer"]], "BinaryCrossEntropyLoss": [[2, "binarycrossentropyloss"]], "CrossEntropyLoss": [[2, "crossentropyloss"]], "MultiCrossEntropyLoss": [[2, "multicrossentropyloss"]], "Embedding Collection": [[2, "embedding-collection"]], "About the HugeCTR embedding collection": [[2, "about-the-hugectr-embedding-collection"]], "Overview of using the HugeCTR embedding collection": [[2, "overview-of-using-the-hugectr-embedding-collection"]], "Known Limitations": [[2, "known-limitations"]], "EmbeddingTableConfig": [[2, "embeddingtableconfig"]], "EmbeddingCollectionConfig": [[2, "embeddingcollectionconfig"]], "embedding_lookup method": [[2, "embedding-lookup-method"]], "shard method": [[2, "shard-method"]], "HugeCTR API Documentation": [[3, "hugectr-api-documentation"]], "HugeCTR Python Interface": [[4, "hugectr-python-interface"]], "About the HugeCTR Python Interface": [[4, "about-the-hugectr-python-interface"]], "High-level Training API": [[4, "high-level-training-api"]], "Solver": [[4, "solver"]], "CreateSolver method": [[4, "createsolver-method"]], "AsyncParam": [[4, "asyncparam"]], "AsyncParam class": [[4, "asyncparam-class"]], "HybridEmbeddingParam": [[4, "hybridembeddingparam"]], "HybridEmbeddingParam class": [[4, "hybridembeddingparam-class"]], "DataReaderParams": [[4, "datareaderparams"]], "DataReaderParams class": [[4, "datareaderparams-class"]], "Dataset formats": [[4, "dataset-formats"]], "Data Files": [[4, "data-files"]], "File List": [[4, "file-list"]], "Raw": [[4, "raw"]], "Parquet": [[4, "parquet"]], "OptParamsPy": [[4, "optparamspy"]], "CreateOptimizer method": [[4, "createoptimizer-method"]], "Layers": [[4, "layers"]], "Model": [[4, "model"], [4, "id2"]], "Model class": [[4, "model-class"]], "add method": [[4, "add-method"]], "compile method": [[4, "compile-method"]], "fit method": [[4, "fit-method"]], "summary method": [[4, "summary-method"]], "graph_to_json method": [[4, "graph-to-json-method"]], "construct_from_json method": [[4, "construct-from-json-method"]], "load_dense_weights method": [[4, "load-dense-weights-method"]], "load_dense_optimizer_states method": [[4, "load-dense-optimizer-states-method"]], "load_sparse_weights method": [[4, "load-sparse-weights-method"]], "load_sparse_optimizer_states method": [[4, "load-sparse-optimizer-states-method"]], "freeze_dense method": [[4, "freeze-dense-method"]], "freeze_embedding method": [[4, "freeze-embedding-method"]], "unfreeze_dense method": [[4, "unfreeze-dense-method"]], "unfreeze_embedding method": [[4, "unfreeze-embedding-method"]], "reset_learning_rate_scheduler method": [[4, "reset-learning-rate-scheduler-method"]], "set_source method": [[4, "set-source-method"], [4, "id1"]], "Low-level Training API": [[4, "low-level-training-api"]], "LearningRateScheduler": [[4, "learningratescheduler"]], "get_next method": [[4, "get-next-method"]], "DataReader": [[4, "datareader"]], "is_eof method": [[4, "is-eof-method"]], "get_learning_rate_scheduler method": [[4, "get-learning-rate-scheduler-method"]], "get_data_reader_train method": [[4, "get-data-reader-train-method"]], "get_data_reader_eval method": [[4, "get-data-reader-eval-method"]], "start_data_reading method": [[4, "start-data-reading-method"]], "set_learning_rate method": [[4, "set-learning-rate-method"]], "train method": [[4, "train-method"]], "get_current_loss method": [[4, "get-current-loss-method"]], "eval method": [[4, "eval-method"]], "get_eval_metrics method": [[4, "get-eval-metrics-method"]], "save_params_to_files method": [[4, "save-params-to-files-method"]], "check_out_tensor method": [[4, "check-out-tensor-method"], [4, "id3"]], "Inference API": [[4, "inference-api"]], "InferenceParams": [[4, "inferenceparams"]], "InferenceParams class": [[4, "inferenceparams-class"]], "InferenceModel": [[4, "inferencemodel"]], "InferenceModel class": [[4, "inferencemodel-class"]], "predict method": [[4, "predict-method"]], "evaluate method": [[4, "evaluate-method"]], "Data Generator API": [[4, "data-generator-api"]], "DataGeneratorParams class": [[4, "datageneratorparams-class"]], "DataGenerator": [[4, "datagenerator"]], "DataGenerator class": [[4, "datagenerator-class"]], "generate method": [[4, "generate-method"]], "Data Source API": [[4, "data-source-api"]], "DataSourceParams class": [[4, "datasourceparams-class"]], "Hierarchical Parameter Server Database Backend": [[5, "hierarchical-parameter-server-database-backend"]], "Introduction to the HPS Database Backend": [[5, "introduction-to-the-hps-database-backend"]], "Background": [[5, "background"]], "Architecture": [[5, "architecture"]], "Training and Iterative Model Updates": [[5, "training-and-iterative-model-updates"]], "Execution": [[5, "execution"]], "Inference": [[5, "inference"]], "Training": [[5, "training"], [53, "training"], [53, "id3"]], "Lookup Optimization": [[5, "lookup-optimization"]], "Configuration": [[5, "configuration"]], "Inference Parameters and Embedding Cache Configuration": [[5, "inference-parameters-and-embedding-cache-configuration"]], "Inference Params Syntax": [[5, "inference-params-syntax"]], "Inference Parameters": [[5, "inference-parameters"]], "Parameter Server Configuration: Models": [[5, "parameter-server-configuration-models"]], "Volatile Database Configuration": [[5, "volatile-database-configuration"]], "Volatile Database Params Syntax": [[5, "volatile-database-params-syntax"]], "Parameter Server Configuration: Volatile Database": [[5, "parameter-server-configuration-volatile-database"]], "Volatile Database Parameters": [[5, "volatile-database-parameters"]], "Overflow Parameters": [[5, "overflow-parameters"]], "Common Volatile Database Parameters": [[5, "common-volatile-database-parameters"]], "Persistent Database Configuration": [[5, "persistent-database-configuration"]], "Persistent Database Params Syntax": [[5, "persistent-database-params-syntax"]], "Parameter Server Configuration: Persistent Database": [[5, "parameter-server-configuration-persistent-database"]], "Persistent Database Parameters": [[5, "persistent-database-parameters"]], "Update Source Configuration": [[5, "update-source-configuration"]], "Update Source Params Syntax": [[5, "update-source-params-syntax"]], "Parameter Server Configuration: Update Source": [[5, "parameter-server-configuration-update-source"]], "Update Source Parameters": [[5, "update-source-parameters"]], "Benchmark the DLRM Model with HPS": [[6, "benchmark-the-dlrm-model-with-hps"]], "Benchmark Setup": [[6, "benchmark-setup"]], "Results": [[6, "results"]], "Resources": [[6, "resources"]], "Hierarchical Parameter Server API": [[7, "hierarchical-parameter-server-api"]], "HPS Initialize": [[8, "hps-initialize"]], "HPS Layers": [[9, "hps-layers"]], "SparseLookupLayer": [[9, "sparselookuplayer"]], "LookupLayer": [[9, "lookuplayer"]], "Hierarchical Parameter Server Plugin for TensorFlow": [[10, "hierarchical-parameter-server-plugin-for-tensorflow"]], "Introduction to the HPS Plugin for TensorFlow": [[10, "introduction-to-the-hps-plugin-for-tensorflow"]], "Benefits of the Plugin for TensorFlow": [[10, "benefits-of-the-plugin-for-tensorflow"]], "Workflow": [[10, "workflow"], [17, "workflow"]], "Installation": [[10, "installation"], [13, "installation"], [17, "installation"], [20, "installation"], [21, "installation"], [22, "installation"], [23, "installation"], [24, "installation"], [26, "installation"], [27, "installation"], [28, "installation"], [30, "installation"], [31, "installation"], [32, "installation"], [33, "installation"]], "Compute Capability": [[10, "compute-capability"], [13, "compute-capability"], [17, "compute-capability"], [38, "compute-capability"]], "Installing HPS Using NGC Containers": [[10, "installing-hps-using-ngc-containers"], [13, "installing-hps-using-ngc-containers"], [17, "installing-hps-using-ngc-containers"]], "Example Notebooks": [[10, "example-notebooks"], [13, "example-notebooks"], [17, "example-notebooks"]], "Benchmark": [[10, "benchmark"], [17, "benchmark"]], "HPS Plugin for Torch API": [[11, "hps-plugin-for-torch-api"]], "HPS Plugin for Torch": [[12, "hps-plugin-for-torch"]], "LookupLayer class": [[12, "lookuplayer-class"]], "Hierarchical Parameter Server Plugin for Torch": [[13, "hierarchical-parameter-server-plugin-for-torch"]], "Introduction to the HPS Plugin for Torch": [[13, "introduction-to-the-hps-plugin-for-torch"]], "HPS Plugin": [[14, "hps-plugin"]], "HPS Plugin Creator": [[15, "hps-plugin-creator"]], "HPS Plugin for TensorRT API": [[16, "hps-plugin-for-tensorrt-api"]], "Hierarchical Parameter Server Plugin for TensorRT": [[17, "hierarchical-parameter-server-plugin-for-tensorrt"]], "Introduction to the HPS Plugin for TensorRT": [[17, "introduction-to-the-hps-plugin-for-tensorrt"]], "Hierarchical Parameter Server": [[18, "hierarchical-parameter-server"], [36, "hierarchical-parameter-server"]], "Profiling HPS": [[19, "profiling-hps"]], "HPS profiler": [[19, "hps-profiler"]], "Build and install the HPS Profiler": [[19, "build-and-install-the-hps-profiler"]], "Create a synthetic embedding table": [[19, "create-a-synthetic-embedding-table"]], "Use the HPS Profiler to get the measurement results": [[19, "use-the-hps-profiler-to-get-the-measurement-results"]], "Profile HPS with Triton Perf Analyzer:": [[19, "profile-hps-with-triton-perf-analyzer"]], "HPS Profiler vs. Triton Perf Analyzer:": [[19, "hps-profiler-vs-triton-perf-analyzer"]], "Hierarchical Parameter Server Demo": [[20, "hierarchical-parameter-server-demo"], [41, "hierarchical-parameter-server-demo"]], "Overview": [[20, "overview"], [21, "overview"], [22, "overview"], [23, "overview"], [24, "overview"], [26, "overview"], [27, "overview"], [28, "overview"], [30, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [41, "overview"], [42, "overview"], [44, "overview"], [53, "overview"]], "Get HPS from NGC": [[20, "get-hps-from-ngc"], [21, "get-hps-from-ngc"], [22, "get-hps-from-ngc"], [23, "get-hps-from-ngc"], [24, "get-hps-from-ngc"], [28, "get-hps-from-ngc"]], "Configurations": [[20, "configurations"], [21, "configurations"], [22, "configurations"], [24, "configurations"], [26, "configurations"], [27, "configurations"], [32, "configurations"], [33, "configurations"]], "Train with native TF layers": [[20, "train-with-native-tf-layers"], [21, "train-with-native-tf-layers"], [22, "train-with-native-tf-layers"], [24, "train-with-native-tf-layers"], [33, "train-with-native-tf-layers"]], "Create the inference graph with HPS LookupLayer": [[20, "create-the-inference-graph-with-hps-lookuplayer"], [24, "create-the-inference-graph-with-hps-lookuplayer"]], "Inference with saved model graph": [[20, "inference-with-saved-model-graph"], [21, "inference-with-saved-model-graph"], [26, "inference-with-saved-model-graph"]], "HPS for Multiple Tables and Sparse Inputs": [[21, "hps-for-multiple-tables-and-sparse-inputs"]], "Create the inference graph with HPS SparseLookupLayer and LookupLayer": [[21, "create-the-inference-graph-with-hps-sparselookuplayer-and-lookuplayer"]], "HPS Pretrained Model Training Demo": [[22, "hps-pretrained-model-training-demo"]], "Load the pre-trained embeddings via HPS": [[22, "load-the-pre-trained-embeddings-via-hps"]], "HPS Table Fusion Demo": [[23, "hps-table-fusion-demo"]], "Create TF SavedModel": [[23, "create-tf-savedmodel"]], "Make inference with HPS table fusion": [[23, "make-inference-with-hps-table-fusion"]], "Deploy SavedModel using HPS with Triton TensorFlow Backend": [[24, "deploy-savedmodel-using-hps-with-triton-tensorflow-backend"], [24, "id1"]], "Deploy TF-TRT SavedModel using HPS with Triton TensorFlow Backend": [[24, "deploy-tf-trt-savedmodel-using-hps-with-triton-tensorflow-backend"]], "Hierarchical Parameter Server Notebooks": [[25, "hierarchical-parameter-server-notebooks"], [29, "hierarchical-parameter-server-notebooks"]], "Quickstart": [[25, "quickstart"], [29, "quickstart"], [34, "quickstart"]], "Pull the NGC Docker": [[25, "pull-the-ngc-docker"], [29, "pull-the-ngc-docker"]], "Clone the HugeCTR Repository": [[25, "clone-the-hugectr-repository"], [29, "clone-the-hugectr-repository"], [34, "clone-the-hugectr-repository"]], "Start the Jupyter Notebook": [[25, "start-the-jupyter-notebook"], [29, "start-the-jupyter-notebook"], [34, "start-the-jupyter-notebook"]], "Notebook List": [[25, "notebook-list"], [29, "notebook-list"], [34, "notebook-list"], [43, "notebook-list"]], "System Specifications": [[25, "system-specifications"], [29, "system-specifications"], [34, "system-specifications"], [43, "system-specifications"]], "SOK to HPS DLRM Demo": [[26, "sok-to-hps-dlrm-demo"]], "Get SOK from NGC": [[26, "get-sok-from-ngc"], [27, "get-sok-from-ngc"]], "Train with SOK embedding layers": [[26, "train-with-sok-embedding-layers"]], "Create the inference graph with HPS SparseLookupLayer": [[26, "create-the-inference-graph-with-hps-sparselookuplayer"]], "SOK Train DLRM Demo": [[27, "sok-train-dlrm-demo"]], "Build model with SOK embedding layers": [[27, "build-model-with-sok-embedding-layers"]], "Train with SOK models": [[27, "train-with-sok-models"]], "HPS Torch Demo": [[28, "hps-torch-demo"]], "Data Generation": [[28, "data-generation"], [31, "data-generation"], [41, "data-generation"]], "Lookup with Table Fusion": [[28, "lookup-with-table-fusion"]], "HPS TensorRT Plugin Benchmark for TensorFlow Large Model": [[30, "hps-tensorrt-plugin-benchmark-for-tensorflow-large-model"]], "Use NGC": [[30, "use-ngc"], [31, "use-ngc"], [32, "use-ngc"], [33, "use-ngc"]], "1. Create the TF model": [[30, "create-the-tf-model"]], "2. Build the HPS-integrated TensorRT engine": [[30, "build-the-hps-integrated-tensorrt-engine"]], "Step1: Prepare the 147GB embedding table": [[30, "step1-prepare-the-147gb-embedding-table"]], "1.1 Train a 147GB model from scratch": [[30, "train-a-147gb-model-from-scratch"]], "1.2 Get the embedding model file in hps format": [[30, "get-the-embedding-model-file-in-hps-format"]], "Step2: Prepare JSON configuration file for HPS": [[30, "step2-prepare-json-configuration-file-for-hps"]], "Step3: Convert to ONNX and do ONNX graph surgery": [[30, "step3-convert-to-onnx-and-do-onnx-graph-surgery"]], "Step4: Build the TensorRT engine": [[30, "step4-build-the-tensorrt-engine"]], "3. Benchmark HPS-integrated TensorRT engine on Triton": [[30, "benchmark-hps-integrated-tensorrt-engine-on-triton"]], "Step1: Create the model repository": [[30, "step1-create-the-model-repository"]], "Step2: Prepare the benchmark input data": [[30, "step2-prepare-the-benchmark-input-data"]], "Step3: Launch the Triton inference server": [[30, "step3-launch-the-triton-inference-server"]], "Step4: Run the benchmark": [[30, "step4-run-the-benchmark"]], "4. Benchmark for ARM64 or Grace + Hooper systems": [[30, "benchmark-for-arm64-or-grace-hooper-systems"]], "Step 1: Build the NVIDIA Merlin docker images": [[30, "step-1-build-the-nvidia-merlin-docker-images"]], "Step 2: Prepare host system for running the docker container": [[30, "step-2-prepare-host-system-for-running-the-docker-container"]], "Step 3: Create the model": [[30, "step-3-create-the-model"]], "Step 4: Prepare data": [[30, "step-4-prepare-data"]], "Step 5: Run benchmark": [[30, "step-5-run-benchmark"]], "HPS TensorRT Plugin Demo for HugeCTR Trained Model": [[31, "hps-tensorrt-plugin-demo-for-hugectr-trained-model"]], "Train with HugeCTR": [[31, "train-with-hugectr"]], "Build the HPS-integrated TensorRT engine": [[31, "build-the-hps-integrated-tensorrt-engine"], [32, "build-the-hps-integrated-tensorrt-engine"], [33, "build-the-hps-integrated-tensorrt-engine"]], "Step1: Prepare JSON configuration file for HPS": [[31, "step1-prepare-json-configuration-file-for-hps"]], "Step2: Convert to ONNX and do ONNX graph surgery": [[31, "step2-convert-to-onnx-and-do-onnx-graph-surgery"], [32, "step2-convert-to-onnx-and-do-onnx-graph-surgery"], [33, "step2-convert-to-onnx-and-do-onnx-graph-surgery"]], "Step3: Build the TensorRT engine": [[31, "step3-build-the-tensorrt-engine"], [32, "step3-build-the-tensorrt-engine"], [33, "step3-build-the-tensorrt-engine"]], "Deploy HPS-integrated TensorRT engine on Triton": [[31, "deploy-hps-integrated-tensorrt-engine-on-triton"], [32, "deploy-hps-integrated-tensorrt-engine-on-triton"]], "HPS TensorRT Plugin Demo for PyTorch Trained Model": [[32, "hps-tensorrt-plugin-demo-for-pytorch-trained-model"]], "Train with PyTorch": [[32, "train-with-pytorch"]], "Step1: Prepare sparse model and JSON configuration file for HPS": [[32, "step1-prepare-sparse-model-and-json-configuration-file-for-hps"], [33, "step1-prepare-sparse-model-and-json-configuration-file-for-hps"]], "HPS TensorRT Plugin Demo for TensorFlow Trained Model": [[33, "hps-tensorrt-plugin-demo-for-tensorflow-trained-model"]], "Deploy HPS-integrated TensorRT engine with Triton on multiple GPUs": [[33, "deploy-hps-integrated-tensorrt-engine-with-triton-on-multiple-gpus"]], "HPS Plugin for TensorRT Notebooks": [[34, "hps-plugin-for-tensorrt-notebooks"]], "Pull the Container from NGC": [[34, "pull-the-container-from-ngc"]], "Contributing to HugeCTR": [[35, "contributing-to-hugectr"]], "Overview of Contributing to HugeCTR": [[35, "overview-of-contributing-to-hugectr"]], "Contribute New Code": [[35, "contribute-new-code"]], "How to Start your Development": [[35, "how-to-start-your-development"]], "Set Up the Development Environment With Merlin Containers": [[35, "set-up-the-development-environment-with-merlin-containers"]], "Build HugeCTR Training Container from Source": [[35, "build-hugectr-training-container-from-source"]], "Build HugeCTR Inference Container from Source": [[35, "build-hugectr-inference-container-from-source"]], "Build Sparse Operation Kit (SOK) from Source": [[35, "build-sparse-operation-kit-sok-from-source"]], "HugeCTR Core Features": [[36, "hugectr-core-features"]], "Summary of Core Features": [[36, "summary-of-core-features"]], "Model Parallel Training": [[36, "model-parallel-training"]], "Multi-Node Training": [[36, "multi-node-training"]], "Mixed Precision Training": [[36, "mixed-precision-training"]], "SGD Optimizer and Learning Rate Scheduling": [[36, "sgd-optimizer-and-learning-rate-scheduling"]], "HugeCTR to ONNX Converter": [[36, "hugectr-to-onnx-converter"]], "HDFS Support": [[36, "hdfs-support"]], "Sparse Operation Kit": [[36, "sparse-operation-kit"], [56, "sparse-operation-kit"]], "HugeCTR Talks and Blogs": [[37, "hugectr-talks-and-blogs"]], "Talks": [[37, "talks"]], "Blogs": [[37, "blogs"]], "Introduction to HugeCTR": [[38, "introduction-to-hugectr"]], "About HugeCTR": [[38, "about-hugectr"]], "Installing and Building HugeCTR": [[38, "installing-and-building-hugectr"]], "Installing HugeCTR Using NGC Containers": [[38, "installing-hugectr-using-ngc-containers"]], "Building HugeCTR from Scratch": [[38, "building-hugectr-from-scratch"]], "Tools": [[38, "tools"]], "Generating Synthetic Data and Benchmarks": [[38, "generating-synthetic-data-and-benchmarks"]], "Downloading and Preprocessing Datasets": [[38, "downloading-and-preprocessing-datasets"]], "Merlin HugeCTR": [[39, "merlin-hugectr"]], "Related Resources": [[39, "related-resources"]], "HugeCTR Embedding Collection": [[40, "hugectr-embedding-collection"]], "About this Notebook": [[40, "about-this-notebook"]], "Concepts and API Reference": [[40, "concepts-and-api-reference"]], "Setup": [[40, "setup"], [41, "setup"], [42, "setup"]], "Use an Embedding Collection with a DLRM Model": [[40, "use-an-embedding-collection-with-a-dlrm-model"]], "Data Preparation": [[40, "data-preparation"], [42, "data-preparation"], [53, "data-preparation"]], "Run the following commands on the terminal to prepare the data for this notebook": [[40, "run-the-following-commands-on-the-terminal-to-prepare-the-data-for-this-notebook"]], "Prepare the Training Script": [[40, "prepare-the-training-script"]], "Embedding Table Placement Strategy: Round Robin": [[40, "embedding-table-placement-strategy-round-robin"]], "Embedding Table Placement Strategy: Uniform": [[40, "embedding-table-placement-strategy-uniform"]], "Embedding Table Placement Strategy: Hybrid": [[40, "embedding-table-placement-strategy-hybrid"]], "Use Dynamic Hash Table with Round Robin Table Placement Strategy": [[40, "use-dynamic-hash-table-with-round-robin-table-placement-strategy"]], "Train from Scratch": [[41, "train-from-scratch"]], "Convert HugeCTR to ONNX": [[41, "convert-hugectr-to-onnx"]], "1. Inference with HPS & ONNX": [[41, "inference-with-hps-onnx"]], "2. Lookup the Embedding Vector from DLPack": [[41, "lookup-the-embedding-vector-from-dlpack"]], "3. Multi-process inference": [[41, "multi-process-inference"]], "4. Redis Cluster deployment (without TLS/SSL)": [[41, "redis-cluster-deployment-without-tls-ssl"]], "5. Redis Cluster deployment (with TLS/SSL)": [[41, "redis-cluster-deployment-with-tls-ssl"]], "HugeCTR End-end Example with NVTabular": [[42, "hugectr-end-end-example-with-nvtabular"]], "Data Preprocessing using NVTabular": [[42, "data-preprocessing-using-nvtabular"]], "Training a WDL model with HugeCTR": [[42, "training-a-wdl-model-with-hugectr"]], "HugeCTR Example Notebooks": [[43, "hugectr-example-notebooks"]], "1. Clone the HugeCTR Repository": [[43, "clone-the-hugectr-repository"]], "2. Pull the NGC Docker and run it": [[43, "pull-the-ngc-docker-and-run-it"]], "3. Customized Building (Optional)": [[43, "customized-building-optional"]], "4. Start the Jupyter Notebook": [[43, "start-the-jupyter-notebook"]], "Training Recommender Systems on Multi-modal Data": [[44, "training-recommender-systems-on-multi-modal-data"]], "MovieLens-25M: Download and Convert": [[45, "movielens-25m-download-and-convert"]], "Getting Started": [[45, "getting-started"]], "Convert the dataset": [[45, "convert-the-dataset"]], "Splitting into train and validation dataset": [[45, "splitting-into-train-and-validation-dataset"]], "Next steps": [[45, "next-steps"]], "MovieLens Data Enrichment": [[46, "movielens-data-enrichment"]], "Scraping data from IMDB": [[46, "scraping-data-from-imdb"]], "Collect synopsis for all movies": [[46, "collect-synopsis-for-all-movies"]], "Scraping movie posters": [[46, "scraping-movie-posters"]], "Movie Poster Feature Extraction with ResNet": [[47, "movie-poster-feature-extraction-with-resnet"]], "Download a pretrained ResNet-50 from NVIDIA GPU cloud": [[47, "download-a-pretrained-resnet-50-from-nvidia-gpu-cloud"]], "Extract features for all movies": [[47, "extract-features-for-all-movies"]], "Movie Synopsis Feature Extraction with Bart text summarization": [[48, "movie-synopsis-feature-extraction-with-bart-text-summarization"]], "Download pretrained BART model": [[48, "download-pretrained-bart-model"]], "Extracting embeddings for all movie\u2019s synopsis": [[48, "extracting-embeddings-for-all-movie-s-synopsis"]], "Creating Multi-Modal Movie Feature Store": [[49, "creating-multi-modal-movie-feature-store"]], "Real data": [[49, "real-data"]], "Synthetic data": [[49, "synthetic-data"]], "ETL with NVTabular": [[50, "etl-with-nvtabular"]], "Defining our Preprocessing Pipeline": [[50, "defining-our-preprocessing-pipeline"]], "Running the pipeline": [[50, "running-the-pipeline"]], "Checking the pre-processing outputs": [[50, "checking-the-pre-processing-outputs"]], "Training HugeCTR Model with Pre-trained Embeddings": [[51, "training-hugectr-model-with-pre-trained-embeddings"]], "Loading pretrained movie features into non-trainable embedding layer": [[51, "loading-pretrained-movie-features-into-non-trainable-embedding-layer"]], "Define and train model": [[51, "define-and-train-model"]], "Multi-modal Example Notebooks": [[52, "multi-modal-example-notebooks"]], "HugeCTR Training with Remote File System Example": [[53, "hugectr-training-with-remote-file-system-example"]], "Setup HugeCTR": [[53, "setup-hugectr"]], "Training with HDFS Example": [[53, "training-with-hdfs-example"]], "Training a DLRM model": [[53, "training-a-dlrm-model"]], "Training a DCN model with AWS S3": [[53, "training-a-dcn-model-with-aws-s3"]], "Data preparation": [[53, "id1"], [53, "id2"]], "Training a DCN model with Google Cloud Storage": [[53, "training-a-dcn-model-with-google-cloud-storage"]], "Performance": [[54, "performance"]], "MLPerf on DGX-2 and DGX A100": [[54, "mlperf-on-dgx-2-and-dgx-a100"]], "Evaluating HugeCTR\u2019s Performance on the DGX-1": [[54, "evaluating-hugectr-s-performance-on-the-dgx-1"]], "Evaluating HugeCTR\u2019s Performance on TensorFlow": [[54, "evaluating-hugectr-s-performance-on-tensorflow"]], "Release Notes": [[55, "release-notes"]], "What\u2019s New in Version 24.06": [[55, "what-s-new-in-version-24-06"]], "What\u2019s New in Version 23.12": [[55, "what-s-new-in-version-23-12"]], "What\u2019s New in Version 23.11": [[55, "what-s-new-in-version-23-11"]], "What\u2019s New in Version 23.08": [[55, "what-s-new-in-version-23-08"]], "What\u2019s New in Version 23.06": [[55, "what-s-new-in-version-23-06"]], "What\u2019s New in Version 23.04": [[55, "what-s-new-in-version-23-04"]], "What\u2019s New in Version 23.02": [[55, "what-s-new-in-version-23-02"]], "What\u2019s New in Version 4.3": [[55, "what-s-new-in-version-4-3"]], "What\u2019s New in Version 4.2": [[55, "what-s-new-in-version-4-2"]], "What\u2019s New in Version 4.1": [[55, "what-s-new-in-version-4-1"]], "What\u2019s New in Version 4.0": [[55, "what-s-new-in-version-4-0"]], "What\u2019s New in Version 3.9": [[55, "what-s-new-in-version-3-9"]], "What\u2019s New in Version 3.8": [[55, "what-s-new-in-version-3-8"]], "What\u2019s New in Version 3.7": [[55, "what-s-new-in-version-3-7"]], "What\u2019s New in Version 3.6": [[55, "what-s-new-in-version-3-6"]], "What\u2019s New in Version 3.5": [[55, "what-s-new-in-version-3-5"]], "What\u2019s New in Version 3.4.1": [[55, "what-s-new-in-version-3-4-1"]], "What\u2019s New in Version 3.4": [[55, "what-s-new-in-version-3-4"]], "What\u2019s New in Version 3.3.1": [[55, "what-s-new-in-version-3-3-1"]], "What\u2019s New in Version 3.3": [[55, "what-s-new-in-version-3-3"]], "What\u2019s New in Version 3.2.1": [[55, "what-s-new-in-version-3-2-1"]], "What\u2019s New in Version 3.2": [[55, "what-s-new-in-version-3-2"]], "What\u2019s New in Version 3.1": [[55, "what-s-new-in-version-3-1"]], "What\u2019s New in Version 3.0.1": [[55, "what-s-new-in-version-3-0-1"]], "What\u2019s New in Version 3.0": [[55, "whats-new-in-version-3-0"]], "What\u2019s New in Version 2.3": [[55, "what-s-new-in-version-2-3"]], "Known Issues": [[55, "known-issues"]]}, "indexentries": {"init() (in module hierarchical_parameter_server)": [[8, "hierarchical_parameter_server.Init"]], "lookuplayer (class in hierarchical_parameter_server)": [[9, "hierarchical_parameter_server.LookupLayer"]], "sparselookuplayer (class in hierarchical_parameter_server)": [[9, "hierarchical_parameter_server.SparseLookupLayer"]], "call() (hierarchical_parameter_server.lookuplayer method)": [[9, "hierarchical_parameter_server.LookupLayer.call"]], "call() (hierarchical_parameter_server.sparselookuplayer method)": [[9, "hierarchical_parameter_server.SparseLookupLayer.call"]]}})
\ No newline at end of file
+Search.setIndex({"docnames": ["QAList", "additional_resources", "api/hugectr_layer_book", "api/index", "api/python_interface", "hierarchical_parameter_server/hps_database_backend", "hierarchical_parameter_server/hps_dlrm_benchmark", "hierarchical_parameter_server/hps_tf_api/index", "hierarchical_parameter_server/hps_tf_api/initialize", "hierarchical_parameter_server/hps_tf_api/layers", "hierarchical_parameter_server/hps_tf_user_guide", "hierarchical_parameter_server/hps_torch_api/index", "hierarchical_parameter_server/hps_torch_api/lookup_layer", "hierarchical_parameter_server/hps_torch_user_guide", "hierarchical_parameter_server/hps_trt_api/hps_plugin", "hierarchical_parameter_server/hps_trt_api/hps_plugin_creator", "hierarchical_parameter_server/hps_trt_api/index", "hierarchical_parameter_server/hps_trt_user_guide", "hierarchical_parameter_server/index", "hierarchical_parameter_server/profiling_hps", "hps_tf/notebooks/hierarchical_parameter_server_demo", "hps_tf/notebooks/hps_multi_table_sparse_input_demo", "hps_tf/notebooks/hps_pretrained_model_training_demo", "hps_tf/notebooks/hps_table_fusion_demo", "hps_tf/notebooks/hps_tensorflow_triton_deployment_demo", "hps_tf/notebooks/index", "hps_tf/notebooks/sok_to_hps_dlrm_demo", "hps_tf/notebooks/sok_train_demo", "hps_torch/notebooks/hps_torch_demo", "hps_torch/notebooks/index", "hps_trt/notebooks/benchmark_tf_trained_large_model", "hps_trt/notebooks/demo_for_hugectr_trained_model", "hps_trt/notebooks/demo_for_pytorch_trained_model", "hps_trt/notebooks/demo_for_tf_trained_model", "hps_trt/notebooks/index", "hugectr_contributor_guide", "hugectr_core_features", "hugectr_talks_blogs", "hugectr_user_guide", "index", "notebooks/embedding_collection", "notebooks/hps_demo", "notebooks/hugectr_e2e_demo_with_nvtabular", "notebooks/index", "notebooks/multi-modal-data/00-Intro", "notebooks/multi-modal-data/01-Download-Convert", "notebooks/multi-modal-data/02-Data-Enrichment", "notebooks/multi-modal-data/03-Feature-Extraction-Poster", "notebooks/multi-modal-data/04-Feature-Extraction-Text", "notebooks/multi-modal-data/05-Create-Feature-Store", "notebooks/multi-modal-data/06-ETL-with-NVTabular", "notebooks/multi-modal-data/07-Training-with-HugeCTR", "notebooks/multi-modal-data/index", "notebooks/training_with_remote_filesystem", "performance", "release_notes", "sparse_operation_kit"], "filenames": ["QAList.md", "additional_resources.md", "api/hugectr_layer_book.md", "api/index.rst", "api/python_interface.md", "hierarchical_parameter_server/hps_database_backend.md", "hierarchical_parameter_server/hps_dlrm_benchmark.md", "hierarchical_parameter_server/hps_tf_api/index.rst", "hierarchical_parameter_server/hps_tf_api/initialize.rst", "hierarchical_parameter_server/hps_tf_api/layers.rst", "hierarchical_parameter_server/hps_tf_user_guide.md", "hierarchical_parameter_server/hps_torch_api/index.rst", "hierarchical_parameter_server/hps_torch_api/lookup_layer.md", "hierarchical_parameter_server/hps_torch_user_guide.md", "hierarchical_parameter_server/hps_trt_api/hps_plugin.md", "hierarchical_parameter_server/hps_trt_api/hps_plugin_creator.md", "hierarchical_parameter_server/hps_trt_api/index.rst", "hierarchical_parameter_server/hps_trt_user_guide.md", "hierarchical_parameter_server/index.md", "hierarchical_parameter_server/profiling_hps.md", "hps_tf/notebooks/hierarchical_parameter_server_demo.ipynb", "hps_tf/notebooks/hps_multi_table_sparse_input_demo.ipynb", "hps_tf/notebooks/hps_pretrained_model_training_demo.ipynb", "hps_tf/notebooks/hps_table_fusion_demo.ipynb", "hps_tf/notebooks/hps_tensorflow_triton_deployment_demo.ipynb", "hps_tf/notebooks/index.md", "hps_tf/notebooks/sok_to_hps_dlrm_demo.ipynb", "hps_tf/notebooks/sok_train_demo.ipynb", "hps_torch/notebooks/hps_torch_demo.ipynb", "hps_torch/notebooks/index.md", "hps_trt/notebooks/benchmark_tf_trained_large_model.ipynb", "hps_trt/notebooks/demo_for_hugectr_trained_model.ipynb", "hps_trt/notebooks/demo_for_pytorch_trained_model.ipynb", "hps_trt/notebooks/demo_for_tf_trained_model.ipynb", "hps_trt/notebooks/index.md", "hugectr_contributor_guide.md", "hugectr_core_features.md", "hugectr_talks_blogs.md", "hugectr_user_guide.md", "index.rst", "notebooks/embedding_collection.ipynb", "notebooks/hps_demo.ipynb", "notebooks/hugectr_e2e_demo_with_nvtabular.ipynb", "notebooks/index.md", "notebooks/multi-modal-data/00-Intro.ipynb", "notebooks/multi-modal-data/01-Download-Convert.ipynb", "notebooks/multi-modal-data/02-Data-Enrichment.ipynb", "notebooks/multi-modal-data/03-Feature-Extraction-Poster.ipynb", "notebooks/multi-modal-data/04-Feature-Extraction-Text.ipynb", "notebooks/multi-modal-data/05-Create-Feature-Store.ipynb", "notebooks/multi-modal-data/06-ETL-with-NVTabular.ipynb", "notebooks/multi-modal-data/07-Training-with-HugeCTR.ipynb", "notebooks/multi-modal-data/index.md", "notebooks/training_with_remote_filesystem.ipynb", "performance.md", "release_notes.md", "sparse_operation_kit.md"], "titles": ["Questions and Answers", "Additional Resources", "HugeCTR Layer Classes and Methods", "HugeCTR API Documentation", "HugeCTR Python Interface", "Hierarchical Parameter Server Database Backend", "Benchmark the DLRM Model with HPS", "Hierarchical Parameter Server API", "HPS Initialize", "HPS Layers", "Hierarchical Parameter Server Plugin for TensorFlow", "HPS Plugin for Torch API", "HPS Plugin for Torch", "Hierarchical Parameter Server Plugin for Torch", "HPS Plugin", "HPS Plugin Creator", "HPS Plugin for TensorRT API", "Hierarchical Parameter Server Plugin for TensorRT", "Hierarchical Parameter Server", "Profiling HPS", "Hierarchical Parameter Server Demo", "HPS for Multiple Tables and Sparse Inputs", "HPS Pretrained Model Training Demo", "HPS Table Fusion Demo", "Deploy SavedModel using HPS with Triton TensorFlow Backend", "Hierarchical Parameter Server Notebooks", "SOK to HPS DLRM Demo", "SOK Train DLRM Demo", "HPS Torch Demo", "Hierarchical Parameter Server Notebooks", "HPS TensorRT Plugin Benchmark for TensorFlow Large Model", "HPS TensorRT Plugin Demo for HugeCTR Trained Model", "HPS TensorRT Plugin Demo for PyTorch Trained Model", "HPS TensorRT Plugin Demo for TensorFlow Trained Model", "HPS Plugin for TensorRT Notebooks", "Contributing to HugeCTR", "HugeCTR Core Features", "HugeCTR Talks and Blogs", "Introduction to HugeCTR", "Merlin HugeCTR", "HugeCTR Embedding Collection", "Hierarchical Parameter Server Demo", "HugeCTR End-end Example with NVTabular", "HugeCTR Example Notebooks", "Training Recommender Systems on Multi-modal Data", "MovieLens-25M: Download and Convert", "MovieLens Data Enrichment", "Movie Poster Feature Extraction with ResNet", "Movie Synopsis Feature Extraction with Bart text summarization", "Creating Multi-Modal Movie Feature Store", "ETL with NVTabular", "Training HugeCTR Model with Pre-trained Embeddings", "Multi-modal Example Notebooks", "HugeCTR Training with Remote File System Example", "Performance", "Release Notes", "Sparse Operation Kit"], "terms": {"try": [0, 5, 31, 36, 41, 46, 47, 55], "provid": [0, 2, 4, 5, 10, 13, 17, 18, 20, 21, 22, 25, 26, 28, 29, 30, 31, 34, 35, 36, 38, 39, 40, 41, 43, 44, 50, 52, 53, 54, 55, 56], "recommend": [0, 2, 4, 5, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 37, 38, 39, 43, 45, 50, 52, 55], "variou": [0, 5, 13, 36, 38], "industri": [0, 36], "high": [0, 3, 5, 10, 13, 17, 18, 20, 21, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 46, 50, 54, 55], "effici": [0, 4, 5, 13, 22, 30, 54, 55], "solut": [0, 18, 36, 38, 55], "onlin": [0, 4, 5, 8, 10, 30, 36, 55], "offlin": [0, 4, 5, 43, 55], "also": [0, 2, 4, 5, 6, 14, 19, 20, 21, 22, 24, 25, 26, 30, 36, 38, 40, 41, 43, 44, 46, 50, 51, 55], "refer": [0, 2, 4, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 44, 53, 55], "design": [0, 2, 4, 5, 13, 35, 36, 37, 38, 39, 50, 55, 56], "develop": [0, 5, 25, 29, 34, 36, 37, 39, 40, 43, 55], "want": [0, 2, 4, 5, 9, 30, 34, 35, 36, 45, 50, 53, 55], "port": [0, 4, 5, 25, 29, 30, 34, 41, 42, 43, 53, 55], "optim": [0, 2, 4, 19, 20, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32, 33, 37, 40, 41, 42, 51, 53, 54, 55], "current": [0, 2, 4, 8, 20, 21, 22, 26, 30, 32, 33, 38, 41, 45, 46, 47, 50, 53, 55], "v2": [0, 2, 4, 24, 47, 55], "dnn": [0, 20, 21, 22, 23, 24, 36, 54, 55, 56], "wdl": [0, 5, 19, 38, 41, 54], "dcn": [0, 2, 4, 36, 38, 54, 55], "deepfm": [0, 38, 55], "dlrm": [0, 10, 17, 25, 30, 31, 32, 33, 38, 54, 55], "variant": [0, 30, 38, 55], "wide": [0, 38, 54, 55], "system": [0, 2, 4, 5, 10, 13, 17, 18, 20, 21, 22, 23, 24, 27, 28, 31, 32, 33, 35, 36, 37, 38, 41, 45, 50, 51, 52, 54, 55], "directori": [0, 4, 5, 10, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 47, 50, 54, 55], "repositori": [0, 4, 10, 18, 19, 24, 31, 32, 33, 35, 36, 38, 39, 40, 41, 53, 54, 55], "github": [0, 4, 19, 23, 25, 28, 29, 30, 33, 34, 35, 36, 38, 39, 40, 41, 43, 47, 50, 53, 54, 55], "them": [0, 2, 4, 9, 13, 20, 21, 22, 23, 24, 26, 30, 35, 50, 55], "express": [0, 2, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "confin": 0, "aforement": [0, 2], "you": [0, 2, 4, 5, 8, 9, 10, 13, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 49, 50, 53, 55, 56], "your": [0, 2, 4, 5, 10, 13, 17, 19, 22, 25, 29, 30, 31, 32, 33, 34, 36, 38, 41, 43, 53, 55], "own": [0, 2, 25, 29, 34, 38], "combin": [0, 2, 4, 5, 9, 10, 13, 17, 20, 21, 22, 26, 27, 28, 31, 32, 33, 35, 36, 40, 41, 42, 44, 51, 53, 55], "ha": [0, 2, 4, 5, 6, 9, 12, 14, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 38, 41, 50, 54, 55], "tf": [0, 6, 8, 9, 10, 25, 26, 27, 35, 41, 54, 55], "yet": [0, 4, 20, 21, 24, 26, 30, 55], "compat": [0, 2, 5, 10, 20, 21, 22, 24, 30, 33, 36, 41, 42, 55, 56], "export": [0, 5, 30, 32, 40, 55], "follow": [0, 2, 4, 5, 6, 8, 10, 13, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 47, 50, 53, 54, 55], "instruct": [0, 19, 20, 21, 22, 23, 24, 26, 30, 33, 35, 40, 41, 42, 53, 55], "dump_to_tf": [0, 55], "tutori": [0, 55], "ye": [0, 5, 19, 41], "check": [0, 2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 53, 55, 56], "out": [0, 2, 4, 5, 22, 24, 30, 32, 33, 36, 41, 43, 50, 55], "dcn2node": 0, "more": [0, 2, 4, 5, 10, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 38, 39, 40, 41, 43, 50, 54, 55], "detail": [0, 3, 4, 6, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 43, 55, 56], "across": [0, 2, 4, 5, 10, 36, 38, 39, 41, 50, 55], "so": [0, 2, 4, 5, 10, 13, 17, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 40, 41, 45, 50, 55], "have": [0, 2, 4, 5, 9, 10, 18, 20, 21, 24, 26, 30, 35, 36, 40, 41, 42, 49, 50, 53, 54, 55], "veri": [0, 36, 40, 55], "larg": [0, 2, 5, 6, 10, 13, 17, 18, 34, 36, 37, 38, 40, 41, 46, 48, 50, 55, 56], "just": [0, 30, 42, 47, 55], "mani": [0, 5, 30, 55, 56], "That": [0, 36, 55], "why": [0, 36], "name": [0, 2, 4, 5, 9, 12, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 38, 40, 41, 42, 43, 46, 47, 50, 51, 53, 55], "suppos": [0, 2, 41], "1tb": [0, 30, 36, 38, 54, 55], "16xv100": 0, "32gb": [0, 20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 53], "take": [0, 4, 5, 6, 19, 30, 31, 32, 33, 38, 41, 45, 46, 50, 55, 56], "case": [0, 2, 4, 5, 6, 30, 32, 36, 41, 53, 54, 55, 56], "comput": [0, 2, 4, 5, 6, 9, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 40, 41, 50, 55], "0": [0, 2, 4, 5, 6, 8, 9, 10, 13, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 54], "v100": [0, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 35, 38, 40, 41, 42, 43, 51, 53, 54, 55], "t4": [0, 10, 13, 17, 38], "A": [0, 2, 4, 5, 9, 19, 25, 29, 30, 34, 36, 37, 38, 40, 41, 43, 50, 55], "machin": [0, 2, 4, 5, 6, 25, 29, 34, 37, 41, 42, 43, 54, 55, 56], "mandatori": 0, "achiev": [0, 2, 4, 5, 6, 13, 28, 30, 36, 41, 54, 55], "best": [0, 2, 4, 5, 6, 22, 28, 36], "perform": [0, 2, 4, 5, 6, 9, 10, 12, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 33, 34, 35, 36, 37, 41, 55], "exploit": [0, 10], "nvswitch": [0, 2], "inter": [0, 36, 41, 54, 55], "bandwidth": [0, 2, 4, 5, 36, 55], "ucx": [0, 42], "howev": [0, 2, 5, 10, 17, 30, 35, 38, 41, 43, 49, 50, 55], "rdma": [0, 4, 36, 55], "maxim": [0, 5, 30], "transact": [0, 36, 54, 55], "approach": [0, 30, 41], "offload": [0, 5, 55], "workload": [0, 4, 55, 56], "oper": [0, 2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 30, 33, 37, 40, 41, 43, 50, 55], "mainli": 0, "decid": [0, 2, 4], "kind": [0, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 53, 55], "o": [0, 2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 45, 46, 50, 51, 55], "devic": [0, 4, 5, 8, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 47, 50, 51, 53, 54, 55], "dataset": [0, 2, 3, 5, 9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 40, 41, 42, 43, 44, 46, 50, 52, 53, 54, 55], "section": [0, 4, 5, 30, 33, 35, 40, 45, 46, 49, 51, 55], "api": [0, 2, 8, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 36, 37, 41, 43, 46, 47, 50, 53, 55], "document": [0, 2, 4, 5, 15, 18, 19, 26, 27, 30, 33, 35, 36, 39, 41, 43, 55, 56], "introduc": [0, 2, 4, 37, 43, 55], "our": [0, 4, 5, 6, 10, 17, 25, 29, 30, 34, 35, 36, 38, 39, 43, 45, 51, 53, 54, 55], "first": [0, 2, 4, 5, 8, 10, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 45, 46, 47, 48, 50, 51, 55], "version": [0, 2, 4, 5, 6, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 49, 50, 51, 53, 54], "exampl": [0, 2, 4, 5, 8, 9, 15, 19, 25, 29, 30, 34, 35, 36, 38, 40, 41, 44, 50, 54, 55], "hashtabl": [0, 26, 27], "base": [0, 2, 4, 5, 9, 17, 19, 24, 25, 30, 31, 32, 33, 34, 36, 38, 41, 45, 50, 52, 55], "dynam": [0, 2, 4, 5, 23, 33, 38, 41, 55], "insert": [0, 2, 5, 6, 19, 28, 30, 31, 32, 33, 38, 41, 55], "new": [0, 4, 5, 22, 24, 25, 38, 41, 42, 46, 50], "ad": [0, 2, 4, 41, 50, 54, 55], "runtim": [0, 5, 8, 10, 13, 17, 25, 29, 34, 38, 41, 42, 43, 55], "skip": [0, 31, 40, 41, 49, 55], "In": [0, 2, 4, 5, 6, 8, 9, 20, 21, 22, 24, 26, 30, 31, 32, 33, 35, 36, 40, 41, 42, 45, 46, 47, 48, 50, 51, 53, 54, 55, 56], "field": [0, 2, 4, 5, 6, 15, 20, 21, 22, 24, 26, 27, 32, 33, 36, 41, 44, 50], "The": [0, 2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 45, 46, 50, 51, 52, 53, 54, 55], "one": [0, 2, 4, 5, 6, 8, 9, 14, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 41, 43, 54, 55], "hot": [0, 2, 4, 10, 19, 21, 24, 27, 31, 36, 41, 45, 50, 55], "number": [0, 2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 40, 41, 42, 44, 45, 51, 53, 54, 55], "specifi": [0, 2, 4, 5, 8, 9, 10, 12, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 42, 43, 53, 55], "slot_num": [0, 2, 4, 5, 20, 21, 22, 24, 26, 27, 30, 32, 33, 51], "There": [0, 2, 4, 10, 19, 30, 31, 32, 33, 38, 43, 55], "sub": [0, 3, 41, 55], "class": [0, 3, 9, 11, 14, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 40, 46, 50, 55], "thei": [0, 4, 5, 20, 21, 22, 24, 26, 27, 45, 47, 55, 56], "distinguish": [0, 55], "method": [0, 3, 6, 33, 40, 41, 42, 53, 55], "distribut": [0, 2, 4, 5, 8, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 36, 37, 38, 39, 40, 41, 42, 53, 55, 56], "call": [0, 2, 4, 8, 9, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 41, 44, 50, 55], "local": [0, 4, 5, 17, 18, 19, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 40, 41, 42, 43, 49, 53, 55], "mai": [0, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 33, 35, 36, 37, 40, 42, 50, 53, 55], "accord": [0, 2, 4, 5, 24, 30, 31, 32, 33, 36, 55], "index": [0, 2, 4, 9, 12, 15, 24, 26, 27, 30, 31, 32, 33, 36, 42, 49, 51, 53, 55], "regardless": [0, 36, 56], "mean": [0, 2, 4, 5, 9, 19, 21, 22, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 40, 41, 43, 47, 48, 50, 55], "thu": [0, 2, 22, 24, 26, 40, 55], "smaller": [0, 5, 36, 55], "than": [0, 2, 4, 5, 9, 19, 24, 30, 36, 43, 50, 54, 55], "reduct": [0, 2, 9, 22, 36, 38], "per": [0, 2, 4, 5, 6, 31, 34, 41, 45, 55], "global": [0, 4, 5, 8, 9, 20, 21, 22, 24, 26, 27, 31, 32, 33, 36, 40, 41, 42, 50, 51, 53, 55], "reduc": [0, 2, 4, 5, 22, 30, 31, 32, 33, 36, 40, 41, 42, 51, 53, 55], "overal": [0, 5, 36], "much": [0, 36, 55], "less": [0, 4, 30, 36, 55], "made": [0, 2, 55], "some": [0, 2, 4, 5, 23, 24, 30, 35, 41, 43, 46, 48, 55], "larger": [0, 4, 5, 9, 36, 55], "trasact": 0, "iter": [0, 2, 4, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "after": [0, 2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 42, 53], "forward": [0, 2, 4, 5, 6, 9, 12, 17, 28, 30, 32, 38, 41, 55], "kernel": [0, 4, 24, 30, 31, 32, 33, 46, 47, 48, 55], "function": [0, 2, 4, 5, 8, 9, 12, 19, 20, 21, 22, 24, 26, 27, 31, 32, 33, 35, 38, 41, 50, 55, 56], "collect": [0, 3, 4, 10, 13, 17, 19, 30, 38, 50, 55], "commun": [0, 2, 4, 5, 36, 55], "librari": [0, 4, 10, 13, 17, 18, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 39, 41, 48, 50, 55], "nccl": [0, 4, 22, 31, 36, 40, 41, 42, 51, 53, 55], "should": [0, 2, 4, 5, 8, 9, 10, 14, 20, 21, 22, 24, 28, 30, 31, 32, 33, 35, 36, 41, 47, 48, 49, 50, 55], "sourc": [0, 3, 8, 9, 10, 13, 17, 19, 31, 36, 38, 39, 40, 41, 42, 43, 51, 53, 55], "where": [0, 2, 5, 9, 17, 36, 40, 41, 44, 46, 55], "spars": [0, 3, 4, 5, 9, 19, 22, 24, 25, 26, 27, 30, 31, 37, 38, 40, 41, 42, 43, 51, 53, 55], "an": [0, 2, 4, 5, 8, 9, 15, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 35, 36, 37, 38, 39, 41, 42, 43, 46, 47, 50, 53, 55], "arrai": [0, 2, 4, 15, 20, 21, 22, 24, 26, 28, 31, 32, 33, 41, 42, 47, 51, 55], "belong": [0, 4], "last": [0, 2, 4, 5, 9, 20, 21, 22, 26, 33, 41, 47, 48], "second": [0, 2, 4, 5, 21, 23, 28, 30, 33, 55], "element": [0, 2, 4, 51, 55], "below": [0, 2, 4, 6, 15, 19, 25, 29, 30, 34, 35, 43, 48, 49, 51], "top": [0, 2, 4, 26, 27, 32, 33, 54, 55], "data1": [0, 2, 4, 40, 41, 51, 53], "type": [0, 3, 4, 5, 8, 9, 10, 14, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 36, 38, 40, 41, 42, 44, 50, 51, 53, 55], "distributedslot": 0, "max_feature_num_per_sampl": 0, "data2": [0, 40, 41], "binari": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 26, 30, 33, 41, 50, 51, 55], "raw": [0, 2, 3, 23, 24, 28, 30, 31, 32, 33, 38, 41, 44, 50, 51, 55], "snapshot": [0, 4, 31, 40, 41, 42, 51, 53], "json": [0, 2, 4, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 41, 42, 47, 50, 51, 53, 55], "interv": [0, 4, 5, 31, 40, 41, 42, 51, 53], "checkpoint": [0, 30, 47], "prefix": [0, 4, 5, 41], "snapshot_prefix": [0, 2, 4, 31, 40, 41, 42, 53], "modifi": [0, 4, 17, 30, 33, 41, 55], "dense_model_fil": [0, 4, 5, 41], "sparse_model_fil": [0, 4, 5, 41], "solver": [0, 2, 3, 31, 40, 41, 42, 51, 53, 55], "write": [0, 4, 5, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "script": [0, 4, 6, 28, 30, 36, 38, 41, 43, 47, 53, 54, 55], "demonstr": [0, 4, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 41, 43, 44, 52, 55], "uniqu": [0, 2, 4, 5, 51, 55], "preprocess": [0, 4, 30, 40, 43, 54, 55], "e": [0, 4, 5, 6, 9, 10, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 36, 41, 46, 47], "g": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 36, 41, 53], "offset": [0, 2, 4, 27, 55], "hash": [0, 2, 5, 31, 38, 41, 42, 51, 53, 55], "nnz": [0, 4, 21, 22, 26, 31, 41], "look": [0, 4, 5, 9, 19, 30, 41, 45, 49, 50, 55], "up": [0, 2, 4, 5, 9, 21, 24, 25, 28, 29, 30, 31, 33, 34, 36, 40, 41, 42, 50, 51, 53, 54, 55], "firstli": [0, 53], "guid": [0, 4, 22, 24, 30, 31, 32, 33, 38, 55], "secondli": [0, 53], "data_gener": [0, 4, 31, 38, 41, 55], "gener": [0, 2, 3, 5, 6, 14, 19, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 35, 50, 54, 55], "random": [0, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 45, 49, 55], "see": [0, 2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 39, 40, 41, 42, 43, 45, 50, 53, 54, 55], "start": [0, 2, 4, 5, 10, 13, 17, 19, 23, 24, 26, 28, 30, 31, 32, 33, 36, 38, 40, 41, 42, 46, 47, 51, 53, 55], "readm": [0, 40, 41, 55], "thirdli": 0, "huge_ctr": 0, "your_config": 0, "alloc": [0, 4, 5, 26, 30, 31, 32, 33, 40, 41, 42, 55], "accordingli": [0, 33, 55], "necessarili": 0, "exact": [0, 2], "depend": [0, 2, 4, 5, 10, 13, 17, 23, 28, 31, 35, 38, 40, 41, 42, 45, 50, 51, 53, 55], "vocabulari": [0, 2, 21, 31, 40, 42, 51, 53, 55], "workspac": [0, 2, 19, 30, 47, 48, 55], "calcul": [0, 2, 4, 5, 42, 50, 55], "tool": [0, 4, 17, 19, 30, 31, 32, 33, 40, 41, 54, 55], "workspace_s": 0, "usual": [0, 2, 53], "real": [0, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 45, 55], "becaus": [0, 2, 5, 6, 19, 26, 27, 30, 41, 50, 54, 55, 56], "non": [0, 2, 4, 5, 10, 20, 21, 22, 23, 24, 26, 30, 31, 33, 35, 40, 41, 42, 43, 53, 55], "uniform": [0, 2, 4, 27, 38], "kei": [0, 2, 4, 5, 9, 10, 12, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 36, 38, 40, 41, 46, 47, 51, 53, 55], "argument": [0, 2, 4, 8, 12, 19, 20, 21, 22, 23, 24, 26, 27, 32, 33, 35, 40, 41, 43, 50, 55], "usag": [0, 3, 4, 5, 10, 19, 30, 31, 32, 33, 40, 42, 55], "replac": [0, 5, 6, 17, 20, 21, 22, 24, 26, 30, 31, 32, 33, 55], "avoid": [0, 2, 4, 5, 20, 21, 22, 26, 30, 33, 36, 41, 55], "wast": [0, 2], "caus": [0, 2, 4, 5, 32, 55], "imbalanc": [0, 2], "add": [0, 3, 10, 13, 15, 17, 19, 21, 25, 29, 30, 31, 34, 35, 38, 40, 41, 42, 43, 50, 51, 53, 55], "maximum": [0, 2, 4, 5, 6, 28, 30, 51, 55], "equat": [0, 4], "_size": [0, 4], "_arrai": [0, 4], "k": [0, 2, 4, 47], "max": [0, 4, 5, 19, 21, 22, 23, 26, 28, 30, 31, 32, 33, 41], "limits_i": [0, 4], "k_i": [0, 4], "list": [0, 2, 3, 5, 6, 9, 20, 21, 24, 26, 27, 28, 30, 32, 33, 40, 41, 42, 45, 46, 47, 50, 51, 55], "inform": [0, 2, 4, 5, 10, 19, 23, 24, 28, 35, 36, 38, 39, 40, 41, 46, 50, 53, 54, 55], "about": [0, 3, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 39, 41, 50, 55], "relat": [0, 2, 4, 5, 24, 35, 53, 55], "amount": [0, 5, 40, 55, 56], "localizedslotsparseembeddinghash": [0, 3, 51, 55], "If": [0, 2, 4, 5, 9, 19, 25, 29, 30, 31, 32, 33, 34, 35, 36, 40, 41, 43, 45, 46, 49, 55], "help": [0, 2, 4, 5, 10, 19, 36, 40, 42, 53, 55], "altern": [0, 4, 5, 30, 43, 55], "both": [0, 2, 4, 5, 6, 26, 27, 35, 36, 41, 49, 50, 53, 54, 55], "localizedslotsparseembeddingonehot": [0, 3, 4], "hybridsparseembed": [0, 4], "workspace_size_per_gpu_in_md": 0, "while": [0, 2, 4, 5, 6, 13, 18, 20, 21, 24, 26, 27, 30, 31, 32, 33, 41, 46, 50, 54, 55, 56], "highli": [0, 2, 55], "reli": [0, 4, 5, 19, 35, 41, 55], "pcie": [0, 34], "connect": [0, 2, 4, 5, 21, 22, 23, 24, 25, 26, 29, 30, 33, 34, 35, 38, 41, 42, 43, 55], "insid": [0, 4, 22, 30, 55], "expect": [0, 50, 55], "150gb": 0, "direct": [0, 50], "It": [0, 2, 4, 5, 8, 10, 12, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 36, 38, 40, 41, 43, 50, 55, 56], "3x": [0, 55], "pci": [0, 20, 21, 22, 23, 24, 26, 33, 41], "convert": [0, 6, 10, 17, 20, 21, 22, 24, 38, 44, 51, 52, 54, 55], "facilit": [0, 10, 30, 55], "process": [0, 2, 4, 5, 8, 24, 30, 31, 32, 33, 36, 40, 42, 45, 46, 49, 54, 55, 56], "save_params_to_fil": [0, 3], "familiar": [0, 4], "pre": [0, 5, 10, 25, 52, 53, 55], "hugectr_criteo": 0, "ipynb": [0, 6, 21, 22, 23, 24, 25, 26, 27, 29, 34, 36, 43, 44, 45, 46, 55], "inher": [0, 38], "extra": [0, 4, 46, 47, 48, 55], "abstract": [0, 2, 4, 50, 55], "awai": [0, 2, 50, 55], "slice": [0, 3, 33, 53, 55], "code": [0, 2, 8, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 50, 53, 55, 56], "cooper": 0, "thread": [0, 4, 5, 8, 20, 21, 22, 23, 24, 26, 31, 32, 33, 35, 38, 41, 42, 46, 54, 55], "cta": 0, "launch": [0, 5, 6, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 41, 43, 55], "foremost": 0, "exce": [0, 2, 5, 18, 55], "block": [0, 8, 30, 31, 32, 33, 41, 46, 55], "would": [0, 5, 32, 55], "better": [0, 2, 4, 5, 30, 42, 55], "warp": [0, 55], "sake": [0, 41], "occup": [0, 19], "still": [0, 4, 5, 24, 55], "freeli": 0, "architectur": [0, 10, 13, 17, 18, 20, 28, 36, 38, 47, 50, 55], "long": [0, 4, 5, 10, 32, 41, 55], "compli": 0, "limit": [0, 3, 5, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 53, 55, 56], "share": [0, 2, 5, 17, 30, 35, 41, 53, 55], "rank": [0, 2, 5, 9, 55], "ipc": [0, 19, 43, 47, 48, 55], "pin": [0, 55], "page": [0, 30, 37, 41, 55], "lock": [0, 55], "resourc": [0, 4, 5, 10, 26, 50, 55, 56], "issu": [0, 2, 5, 30, 33, 35], "option": [0, 2, 4, 5, 6, 19, 22, 24, 30, 33, 35, 36, 38, 41, 42, 46, 53, 55], "docker": [0, 5, 10, 13, 17, 19, 34, 35, 38, 41, 47, 48, 53, 55], "command": [0, 6, 10, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 38, 41, 43, 49, 53, 55], "host": [0, 4, 5, 10, 13, 17, 18, 19, 25, 29, 31, 32, 33, 34, 38, 41, 42, 43, 47, 48, 54, 55], "ulimit": [0, 19, 43, 55], "memlock": [0, 19, 43, 55], "stack": [0, 19, 28, 43, 47], "67108864": [0, 19, 43], "leverag": [0, 4, 6, 8, 10, 13, 17, 22, 24, 25, 30, 36, 50, 55], "hirarch": 0, "paramet": [0, 2, 4, 8, 9, 15, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 37, 43, 53, 55, 56], "cach": [0, 4, 6, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 36, 37, 41, 47, 55], "hierarch": [0, 2, 4, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 37, 43, 55], "storag": [0, 4, 5, 10, 13, 17, 18, 20, 28, 30, 31, 32, 33, 36, 40, 41, 42, 55], "encompass": [0, 10, 17], "databas": [0, 4, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 36, 41, 46, 55], "backend": [0, 4, 6, 10, 13, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33, 35, 36, 41, 47, 53, 55], "updat": [0, 4, 19, 22, 24, 27, 32, 35, 41, 43, 50, 53, 55], "manag": [0, 5, 10, 26, 30, 31, 32, 33, 41, 46, 55], "exhaust": [0, 5, 55], "constantli": [0, 10], "trigger": [0, 5, 8, 22, 33, 36, 55], "thi": [0, 2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56], "messag": [0, 5, 19, 33, 35, 41, 42, 55], "scenario": [0, 36, 55, 56], "either": [0, 4, 5, 9, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 53], "enforc": [0, 50], "mode": [0, 2, 4, 5, 6, 10, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 51, 53, 55], "hit_rate_threshold": [0, 4, 5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "extend": [0, 2, 5, 10, 21, 22, 26, 27, 55], "enough": [0, 2, 55], "number_of_worker_buffers_in_pool": [0, 4, 5], "pleas": [0, 2, 4, 5, 6, 10, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 46, 53, 55, 56], "hp": [0, 4, 18, 25, 27, 29, 36, 43, 55], "talk": [1, 55], "blog": [1, 54, 55], "question": [1, 35], "answer": 1, "contribut": [1, 55], "hugectr": [1, 5, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 44, 50, 52, 55], "differ": [2, 4, 5, 10, 17, 18, 19, 22, 23, 28, 31, 33, 34, 35, 36, 40, 41, 45, 55], "correspond": [2, 4, 5, 9, 36, 41, 50, 55], "python": [2, 3, 5, 10, 13, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 36, 37, 38, 41, 42, 43, 49, 51, 53, 55, 56], "descript": [2, 15, 40, 42, 44, 55], "each": [2, 4, 5, 8, 9, 10, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 34, 36, 38, 40, 41, 42, 43, 50, 51, 53, 54, 55], "includ": [2, 4, 5, 10, 17, 18, 19, 36, 38, 41, 44, 45, 46, 55], "its": [2, 4, 5, 6, 9, 20, 21, 22, 24, 25, 29, 30, 33, 34, 36, 38, 43, 46, 55], "data": [2, 3, 5, 6, 9, 14, 19, 20, 21, 22, 24, 26, 27, 32, 33, 35, 36, 43, 45, 47, 50, 51, 52, 54, 55, 56], "model": [2, 3, 8, 9, 10, 12, 13, 15, 17, 18, 19, 23, 24, 25, 28, 34, 35, 37, 38, 41, 43, 44, 47, 50, 52, 54, 55, 56], "instanc": [2, 4, 5, 6, 9, 30, 33, 36, 46, 47, 48, 55, 56], "sparseembed": [2, 4, 31, 41, 42, 51, 53, 55], "denselay": [2, 4, 31, 40, 41, 42, 51, 53, 55], "can": [2, 4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 43, 44, 45, 46, 50, 53, 54, 55, 56], "access": [2, 5, 10, 13, 17, 18, 25, 29, 30, 31, 34, 40, 41, 42, 43, 51, 53, 55], "label_dim": [2, 4, 5, 31, 40, 41, 42, 51, 53, 55], "integ": [2, 4, 5, 12, 38, 50, 54], "label": [2, 4, 9, 20, 21, 22, 24, 26, 27, 31, 32, 33, 35, 38, 40, 41, 42, 50, 51, 53, 54, 55], "dimens": [2, 4, 9, 20, 21, 22, 24, 26, 27, 32, 33, 55], "1": [2, 4, 5, 6, 8, 9, 10, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 40, 42, 45, 46, 47, 48, 49, 50, 51, 53], "impli": [2, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "i": [2, 4, 5, 6, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55, 56], "For": [2, 4, 5, 6, 9, 10, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 50, 54, 55], "item": [2, 4, 44, 46, 47, 48, 53, 54, 55], "click": [2, 36, 37, 38, 39, 54, 55], "NO": [2, 4, 19, 41], "default": [2, 4, 5, 9, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 38, 40, 41, 43, 54, 55], "valu": [2, 4, 5, 8, 9, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 40, 41, 47, 48, 49, 51, 55], "user": [2, 4, 5, 10, 13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 38, 40, 42, 44, 45, 50, 51, 53, 54, 55], "label_nam": [2, 4, 31, 40, 41, 42, 51, 53], "string": [2, 4, 5, 8, 9, 12, 15, 31, 41, 45, 50, 55], "tensor": [2, 4, 9, 12, 20, 21, 22, 24, 25, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53, 55], "referenc": [2, 10, 38], "dense_dim": [2, 4, 22, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "continu": [2, 4, 5, 30, 43, 46, 50, 55], "featur": [2, 4, 5, 9, 20, 21, 22, 24, 25, 26, 27, 30, 31, 32, 33, 35, 38, 40, 41, 42, 44, 45, 46, 50, 52, 53, 54, 55], "set": [2, 4, 5, 8, 17, 20, 21, 23, 25, 26, 29, 30, 33, 34, 36, 38, 40, 41, 43, 46, 47, 50, 53, 54, 55], "dense_nam": [2, 4, 31, 40, 41, 42, 51, 53], "data_reader_sparse_param_arrai": [2, 4, 31, 40, 41, 42, 51, 53], "datareadersparseparam": [2, 4, 31, 40, 41, 42, 51, 53], "categor": [2, 4, 30, 38, 44, 45, 50, 51, 54, 55], "construct": [2, 4, 41, 50, 55], "sparse_nam": 2, "nnz_per_slot": [2, 51, 55], "is_fixed_length": [2, 51, 55], "reader": [2, 4, 31, 35, 38, 40, 41, 42, 51, 53, 55], "int": [2, 4, 5, 8, 9, 27, 28, 30, 31, 32, 33, 41, 42, 51, 55], "which": [2, 4, 5, 6, 8, 9, 12, 13, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 43, 50, 54, 55, 56], "appli": [2, 4, 5, 13, 19, 20, 24, 25, 28, 30, 35, 36, 40, 50, 54, 55], "everi": [2, 4, 32, 55], "slot": [2, 4, 5, 21, 22, 26, 36, 38, 41, 42, 55], "could": [2, 5, 22, 24, 30, 33, 41, 55], "conveni": [2, 10, 13, 17, 19, 25, 29, 34, 38, 43, 55], "all": [2, 4, 5, 6, 8, 9, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 50, 51, 53, 54, 55, 56], "same": [2, 4, 5, 6, 9, 12, 17, 20, 21, 23, 24, 25, 26, 28, 30, 32, 33, 36, 50, 54, 55], "Or": 2, "initi": [2, 4, 5, 7, 9, 12, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 36, 38, 41, 42, 43, 50, 55], "when": [2, 4, 5, 8, 10, 14, 15, 17, 21, 22, 24, 25, 27, 28, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 43, 50, 53, 55], "length": [2, 4, 5, 24, 27, 41], "ident": [2, 5, 24, 30, 33, 55], "note": [2, 4, 5, 9, 19, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 36, 40, 41, 43, 46, 47, 48, 51, 53], "rawasync": [2, 4, 55], "onli": [2, 4, 5, 8, 10, 20, 22, 24, 30, 31, 32, 33, 35, 36, 38, 40, 41, 50, 51, 54, 55, 56], "static": [2, 4, 5, 19, 28, 30, 31, 32, 41, 55], "support": [2, 4, 5, 9, 10, 13, 15, 17, 19, 20, 21, 22, 24, 26, 28, 30, 31, 32, 33, 35, 38, 40, 41, 48, 50, 51, 53, 55, 56], "impact": [2, 55], "parquet": [2, 3, 31, 38, 40, 41, 42, 45, 49, 50, 51, 53, 55], "identifi": [2, 38, 47, 55], "whether": [2, 4, 5, 41, 56], "among": [2, 4, 36, 56], "sampl": [2, 4, 5, 6, 10, 13, 17, 28, 30, 31, 35, 36, 38, 40, 41, 42, 55], "true": [2, 4, 5, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 42, 46, 47, 48, 51, 53, 55], "transfer": [2, 10, 41, 55], "time": [2, 5, 8, 17, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 44, 45, 46, 50, 51, 53, 54, 55], "13": [2, 4, 6, 21, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53, 54, 55], "26": [2, 4, 5, 6, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 47, 51, 53, 54], "wide_data": [2, 4, 42], "2": [2, 4, 5, 6, 8, 9, 10, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 40, 42, 45, 47, 49, 50, 51, 53], "deep_data": [2, 4, 42], "One": 2, "sever": [2, 4, 5, 10, 19, 20, 21, 22, 23, 24, 30, 36, 40, 44, 52, 55], "befor": [2, 4, 5, 8, 9, 10, 21, 22, 23, 24, 26, 27, 35, 38, 40, 41, 42, 43, 47, 53, 55], "embedding_typ": [2, 4, 31, 41, 42, 51, 53], "embedding_t": [2, 4, 28, 31, 41, 42, 51, 53], "doe": [2, 4, 5, 19, 22, 25, 26, 29, 30, 31, 32, 33, 34, 43, 55], "must": [2, 4, 5, 8, 9, 14, 17, 27, 30, 33, 36, 55], "workspace_size_per_gpu_in_mb": [2, 4, 31, 41, 42, 51, 53, 55], "memori": [2, 4, 5, 10, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 36, 40, 41, 42, 43, 50, 55, 56], "size": [2, 4, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 34, 36, 40, 41, 42, 46, 50, 51, 53, 54, 55], "megabyt": 2, "gpu": [2, 4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 48, 50, 51, 53, 54, 55, 56], "big": 2, "hold": [2, 5], "state": [2, 4, 5, 24, 31, 35, 36, 41, 42, 48, 50, 51, 53, 55], "dure": [2, 4, 5, 20, 21, 24, 26, 27, 30, 36, 38, 55], "train": [2, 3, 10, 17, 18, 19, 23, 25, 34, 37, 38, 39, 43, 47, 50, 52, 54, 55, 56], "evalu": [2, 3, 5, 8, 20, 21, 24, 26, 31, 40, 41, 42, 50, 51, 53, 55], "To": [2, 4, 5, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 33, 34, 35, 36, 38, 40, 41, 42, 43, 53, 55], "understand": [2, 55], "how": [2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 40, 41, 43, 50, 52, 55], "slot_size_arrai": [2, 4, 31, 40, 41, 42, 51, 53, 55], "embedding_vec_s": [2, 4, 20, 21, 22, 23, 24, 26, 28, 31, 32, 33, 41, 42, 51, 53], "vector": [2, 4, 5, 9, 10, 12, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 38, 55], "intra": [2, 36, 54], "sum": [2, 4, 9, 21, 40, 41, 42, 51, 53, 55], "sparse_embedding_nam": [2, 4, 31, 41, 42, 51, 53], "bottom_nam": [2, 4, 31, 40, 41, 42, 51, 53], "bottom": [2, 26, 27, 32, 33, 55], "consum": [2, 5, 55, 56], "predefin": 2, "from": [2, 4, 5, 9, 10, 13, 14, 17, 18, 19, 25, 29, 31, 32, 33, 36, 40, 42, 43, 44, 45, 48, 49, 50, 51, 53, 54, 55], "consist": [2, 4, 5, 10, 13, 15, 17, 24, 30, 38, 40, 41, 50, 55], "optparamspi": [2, 3], "dedic": [2, 10, 17, 36, 37, 38, 55, 56], "do": [2, 4, 5, 13, 19, 20, 21, 24, 26, 35, 36, 40, 43, 46, 53, 55], "adopt": [2, 4, 55], "store": [2, 4, 5, 6, 9, 10, 20, 22, 24, 30, 31, 32, 33, 36, 40, 41, 43, 44, 45, 46, 52, 53, 55], "tabl": [2, 4, 5, 6, 9, 10, 12, 13, 15, 17, 18, 20, 22, 24, 25, 26, 27, 29, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 51, 53, 55, 56], "get": [2, 4, 14, 36, 40, 41, 42, 46, 48, 55], "indic": [2, 4, 5, 9, 20, 21, 22, 24, 26, 30, 32, 33, 38, 55], "segment": [2, 24, 55], "multipl": [2, 4, 5, 8, 9, 10, 20, 22, 24, 25, 26, 35, 36, 38, 39, 41, 50, 55, 56], "span": 2, "node": [2, 4, 5, 14, 17, 24, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 43, 51, 53, 54, 55], "With": [2, 5, 25, 29, 34, 36, 55, 56], "portion": [2, 24], "": [2, 4, 5, 10, 13, 17, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 33, 34, 36, 37, 38, 40, 41, 42, 43, 44, 46, 47, 50, 51], "exist": [2, 5, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 41, 42, 45, 46, 50, 55, 56], "load": [2, 4, 5, 10, 17, 19, 20, 21, 23, 24, 25, 26, 27, 30, 31, 32, 33, 36, 38, 41, 45, 46, 47, 48, 49, 53, 55], "imbal": [2, 55], "oom": 2, "import": [2, 8, 9, 10, 13, 15, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 45, 46, 47, 48, 49, 50, 51, 53, 55], "singl": [2, 4, 36, 40, 41, 42, 50, 54, 55, 56], "assum": [2, 4, 5, 9, 30, 38, 41, 55], "repres": [2, 9, 19, 22, 26, 40, 50], "id": [2, 4, 5, 9, 20, 21, 22, 23, 24, 25, 26, 29, 30, 33, 34, 35, 40, 41, 44], "ar": [2, 4, 5, 6, 9, 10, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 44, 45, 46, 47, 49, 50, 51, 53, 54, 55, 56], "map": [2, 4, 5, 20, 21, 22, 23, 24, 26, 28, 31, 32, 33, 40, 41, 42, 51, 53, 55], "input_key_typ": [2, 4], "By": [2, 5, 13, 35, 36, 43, 50, 55], "32": [2, 4, 5, 6, 8, 21, 23, 25, 29, 30, 32, 33, 34, 40, 41, 42, 43, 46, 47, 51, 53, 55], "bit": [2, 5, 38, 41, 55], "i32": [2, 4], "64": [2, 4, 5, 6, 8, 21, 23, 34, 38, 41, 47], "i64": [2, 4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "allow": [2, 4, 5, 10, 13, 17, 25, 29, 30, 34, 36, 38, 41, 43, 46, 47, 48, 50, 55], "even": [2, 5, 36, 37, 55], "constrain": 2, "addit": [2, 4, 5, 30, 35, 36, 45, 50, 55], "overflow": [2, 31, 32, 33, 55], "verifi": [2, 4, 25, 29, 34, 43, 55], "beyond": [2, 5], "neg": [2, 55], "confid": 2, "disabl": [2, 5, 30, 31, 33, 35, 48, 55], "environ": [2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 38, 40, 41, 42, 43, 53, 54, 55], "variabl": [2, 4, 17, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 41, 53, 55], "hugectr_disable_overflow_check": [2, 55], "23": [2, 4, 6, 10, 17, 23, 24, 25, 30, 32, 33, 34, 40, 41, 42, 47, 48, 53], "sparse_embedding1": [2, 4, 5, 8, 20, 21, 24, 30, 31, 40, 41, 42, 51, 53], "input_data": [2, 42], "unlik": [2, 5, 54], "individu": [2, 4], "locat": [2, 5, 35, 36, 38, 41, 43, 53, 55, 56], "scalabl": [2, 10, 18, 36, 54, 55], "avail": [2, 4, 5, 8, 10, 13, 17, 18, 20, 21, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 36, 38, 39, 40, 41, 42, 43, 46, 49, 54, 55, 56], "togeth": [2, 4, 35, 39, 41, 43, 55], "format": [2, 3, 5, 6, 10, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 38, 40, 41, 42, 45, 50, 51, 54, 55], "other": [2, 4, 5, 8, 9, 10, 18, 20, 21, 22, 23, 24, 26, 30, 32, 33, 35, 36, 41, 43, 44, 50, 54, 55], "equip": [2, 5, 30], "dgx": [2, 40], "a100": [2, 6, 10, 13, 17, 19, 34, 35, 38, 43, 48], "1221": 2, "754": [2, 40], "8": [2, 4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 38, 40, 41, 42, 47, 48, 49, 53], "4": [2, 4, 5, 6, 10, 20, 21, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 38, 40, 42, 45, 47, 49, 50, 51, 53, 54], "12": [2, 4, 6, 20, 21, 23, 24, 26, 28, 31, 32, 33, 40, 41, 42, 47, 51, 53], "49": [2, 20, 23, 32, 33, 40, 41, 42, 47, 51], "128": [2, 4, 5, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 47, 50, 51, 53], "loss": [2, 4, 20, 21, 22, 24, 26, 27, 31, 32, 33, 36, 40, 41, 42, 51, 53, 54, 55], "final": [2, 4, 43, 49, 55], "fuse": [2, 5, 23, 25, 28, 30, 33, 41, 55], "util": [2, 4, 5, 10, 13, 19, 20, 21, 22, 24, 25, 26, 30, 31, 32, 33, 36, 38, 40, 41, 43, 45, 55, 56], "layer_typ": [2, 4, 31, 40, 41, 42, 51, 53], "layer_t": [2, 4, 31, 40, 41, 42, 51, 53, 55], "cast": [2, 31, 32, 33], "innerproduct": [2, 4, 40, 41, 42, 51, 53], "prelu_dic": 2, "str": [2, 4, 5, 8, 9, 20, 21, 22, 23, 24, 26, 27, 28, 32, 33, 40, 42, 49, 51, 55], "top_nam": [2, 4, 31, 40, 41, 42, 51, 53], "output": [2, 4, 6, 9, 14, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 35, 40, 41, 42, 43, 46, 48, 51, 53, 55], "num_output": [2, 4, 31, 40, 41, 42, 51, 53], "weight_init_typ": 2, "weight": [2, 4, 6, 9, 10, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 36, 38, 41, 42, 51, 53, 55], "initializer_t": 2, "xaviernorm": 2, "xavieruniform": 2, "zero": [2, 4, 5, 20, 21, 22, 23, 24, 26, 28, 36, 41, 49, 51, 55], "bias_init_typ": 2, "bia": [2, 32, 47, 55], "shape": [2, 4, 6, 9, 14, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 47, 49, 51, 53, 55], "batch_siz": [2, 14, 21, 22, 26, 27, 30, 31, 32, 33, 41, 55], "ani": [2, 4, 5, 8, 10, 20, 21, 22, 23, 24, 26, 27, 28, 32, 35, 36, 40, 41, 42, 53, 55], "relu1": [2, 40, 41, 42, 51, 53], "fc2": [2, 22, 30, 40, 41, 42, 51, 53], "1024": [2, 4, 5, 6, 19, 21, 22, 24, 26, 27, 30, 31, 32, 33, 40, 41, 42, 47, 48, 49, 51, 53, 54], "relu2": [2, 40, 42, 51, 53], "compris": [2, 4, 30, 31, 32, 33, 34, 48, 51], "fulli": [2, 5, 23, 31, 34, 36, 38, 40, 41, 42, 51, 53, 55, 56], "fp16": [2, 6, 24, 30, 36, 55], "fp32": [2, 4, 6, 24, 31, 32, 33, 55], "tf32": [2, 30, 33, 55], "act_typ": [2, 31], "activ": [2, 4, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 54, 55], "activation_t": [2, 31], "use_bia": [2, 31], "boolean": [2, 4, 5], "overrid": [2, 4, 26, 53], "bias": 2, "compute_config": 2, "denselayercomputeconfig": [2, 55], "configur": [2, 4, 6, 8, 9, 10, 12, 13, 15, 17, 18, 19, 23, 28, 35, 36, 38, 40, 41, 51, 53, 55], "valid": [2, 4, 5, 35, 42, 50, 51, 53, 55], "flag": [2, 5, 20, 21, 22, 23, 24, 26, 30, 33, 41, 55], "async_wgrad": [2, 55], "fuse_wb": [2, 55], "wgrad": [2, 55], "asynchron": [2, 4, 5, 19, 38, 55], "dgrad": 2, "fals": [2, 4, 5, 19, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 40, 41, 42, 46, 47, 50, 51, 53, 55], "bgrad": 2, "compute_config_bottom": 2, "compute_config_top": 2, "mlp1": [2, 31], "512": [2, 4, 5, 24, 25, 29, 30, 31, 32, 33, 34, 40, 43, 47, 50, 51, 53], "256": [2, 4, 5, 6, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 47, 53, 55], "interaction1": [2, 31, 40, 53], "interaction_grad": 2, "mlp2": [2, 31], "cross": [2, 35, 38, 40, 41, 42, 53, 54, 55], "network": [2, 4, 5, 14, 17, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 43, 44, 47, 50, 51, 53, 54, 55], "explicit": [2, 19, 24, 30, 31, 32, 33], "two": [2, 4, 5, 10, 18, 19, 21, 24, 27, 30, 35, 36, 40, 50, 51, 53, 55], "invent": 2, "v1": [2, 20, 21, 22, 24, 30, 33, 35, 53, 54], "respect": [2, 4, 5, 10, 55], "n": [2, 5, 9, 24, 26, 30, 31, 32, 33, 40, 41, 42, 47, 50], "mathemat": 2, "formula": [2, 55], "those": [2, 4, 30, 55], "x_": 2, "l": [2, 26, 27, 46, 53], "x": [2, 4, 6, 8, 9, 26, 27, 32, 33, 34, 41, 42, 49, 53], "t": [2, 19, 24, 30, 35, 36, 42, 47, 50, 55], "_": [2, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 40, 42], "w_": 2, "b_l": 2, "x_l": 2, "w_l": 2, "mathbb": 2, "r": [2, 26, 27, 30, 47, 53], "times1": 2, "learnabl": 2, "x_0": 2, "odot": 2, "mathbf": 2, "w": [2, 19, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 41, 43, 55], "elementwis": 2, "dot": 2, "_l": 2, "decreas": [2, 5], "complex": [2, 5, 38, 50], "approxim": [2, 5], "factor": [2, 55], "lower": [2, 5, 35, 38], "matric": 2, "u": [2, 5, 6, 19, 25, 29, 30, 34, 35, 41, 43, 53, 55], "v": [2, 25, 29, 30, 34, 43, 47, 48, 55], "project": [2, 4, 10, 17, 18, 38, 39, 55], "correspondingli": [2, 4, 8, 24], "evolv": 2, "num_lay": [2, 30, 53], "posit": [2, 4, 55], "projection_dim": 2, "degrad": [2, 5, 55], "slice11": [2, 53], "multicross1": [2, 53], "6": [2, 4, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 36, 38, 40, 41, 42, 47, 50, 53], "thefmorder2": 2, "order": [2, 4, 5, 9, 20, 21, 22, 24, 26, 30, 31, 32, 33, 41, 50, 55], "fm": 2, "linear": [2, 32, 47, 54], "pairwis": 2, "product": [2, 5, 10, 19], "latent": 2, "out_dim": [2, 26, 27], "slice32": 2, "10": [2, 4, 5, 6, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 46, 47, 51, 53, 55], "multipli": [2, 9, 47, 55], "space": [2, 5, 30, 42], "weight_dim": 2, "matrix": [2, 4, 9, 36, 51], "slot_dim": 2, "vec_dim": 2, "correctli": [2, 4, 36, 41, 55], "emploi": [2, 4, 5, 28, 30, 31, 32, 33, 55], "result": [2, 4, 5, 9, 24, 28, 30, 31, 32, 33, 35, 36, 41, 50, 54, 55], "wise": [2, 55], "none": [2, 9, 20, 21, 22, 23, 24, 26, 27, 30, 33, 41, 42, 48, 51, 53, 55], "2x": [2, 24], "num_elem": 2, "slice1": 2, "slice2": 2, "eltmultiply1": 2, "implement": [2, 4, 5, 24, 33, 35, 36, 38, 41, 50, 55], "cudnn": [2, 30, 31, 32, 33, 47, 55], "batch": [2, 4, 5, 6, 8, 9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 38, 41, 47, 54, 55], "normal": [2, 40, 41, 42, 50], "float": [2, 4, 5, 9, 30, 32, 33, 47, 48], "exponenti": 2, "averag": [2, 4, 5, 30, 34, 35, 48, 55], "runningmean": 2, "newmean": 2, "ep": [2, 47], "epsilon": [2, 4, 31, 42], "1e": [2, 4, 28, 41, 47, 50], "5": [2, 4, 5, 6, 8, 9, 10, 13, 17, 20, 21, 22, 23, 24, 26, 28, 32, 33, 36, 38, 40, 42, 45, 46, 47, 49, 50, 51, 53], "gamma_init_typ": 2, "gamma": 2, "beta_init_typ": 2, "beta": [2, 4, 32], "00001": [2, 24], "varianc": 2, "file": [2, 3, 5, 6, 8, 9, 10, 12, 15, 19, 20, 21, 22, 23, 24, 26, 27, 28, 35, 36, 38, 40, 41, 42, 43, 45, 46, 47, 50, 51, 54, 55], "my_snapshot_dense_5000": 2, "find": [2, 4, 5, 30, 35, 38, 50, 54, 55], "norm": [2, 4, 9, 38, 55], "shown": [2, 4, 5, 6, 8, 10, 17, 54], "192325": 2, "003050": 2, "323447": 2, "034817": 2, "091861": 2, "var": [2, 31, 32, 33], "738942": 2, "410794": 2, "370279": 2, "156337": 2, "638146": 2, "759954": 2, "251507": 2, "648882": 2, "176316": 2, "515163": 2, "434012": 2, "422724": 2, "001451": 2, "756962": 2, "126412": 2, "851878": 2, "837513": 2, "694674": 2, "791046": 2, "849544": 2, "694500": 2, "405566": 2, "211646": 2, "936811": 2, "659098": 2, "2d": [2, 55], "3d": [2, 55], "seq_len": 2, "4d": [2, 55], "num_attention_head": 2, "concaten": [2, 20, 21, 24, 26, 27, 28, 30, 32, 33, 38, 51, 55], "axi": [2, 6, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33, 42, 45, 48, 55], "dimension": [2, 38, 55], "num_feas_0": 2, "num_elems_0": 2, "num_fea": [2, 26, 27, 32, 33, 55], "num_elems_1": 2, "num_feas_1": 2, "reshape3": 2, "weight_multiply2": 2, "concat2": [2, 26, 27, 33, 53], "leading_dim": [2, 41, 42, 51, 53], "innermost": 2, "total": [2, 4, 5, 9, 10, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 41, 42, 46, 50, 51], "unspecifi": [2, 41], "n_slot": 2, "time_step": 2, "defin": [2, 5, 15, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 42, 45, 53], "selected_slot": 2, "ignor": [2, 4, 30, 32, 33, 41, 42, 53], "destin": [2, 55], "placehold": [2, 17, 24, 30, 31, 32, 33], "cannot": [2, 5, 9, 10, 31, 35, 38, 40, 41, 42, 47, 51, 53, 56], "deprec": [2, 4, 5, 41, 43, 55], "futur": [2, 4, 5, 20, 21, 22, 26, 28, 35, 41, 55], "restrict": [2, 4, 10, 55], "tailing_dim": 2, "reshape1": [2, 26, 33, 41, 42, 51, 53], "416": [2, 32, 41, 42, 53], "dim": [2, 24, 30, 31, 32, 33, 47], "select1": 2, "selct": 2, "extract": [2, 10, 20, 21, 22, 24, 32, 33, 44, 49, 51, 52], "rang": [2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 42, 46, 47, 49, 53, 55], "tupl": [2, 27], "creat": [2, 4, 5, 6, 10, 22, 28, 31, 32, 33, 35, 40, 41, 42, 43, 44, 45, 46, 47, 50, 52, 53, 55], "inclus": 2, "end": [2, 4, 5, 18, 19, 23, 24, 28, 30, 31, 36, 40, 41, 51, 53, 55], "exclus": [2, 19, 30, 55], "overlap": [2, 4, 5, 23, 28, 54, 55], "unless": [2, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 43, 53], "revers": 2, "along": [2, 4, 9, 55], "b": [2, 4, 24, 30, 41], "d": [2, 4, 30, 32, 40, 41, 42, 46, 47, 49, 51, 55], "c": [2, 10, 18, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 43, 50, 55], "len": [2, 21, 22, 23, 26, 27, 28, 30, 32, 40, 41, 42, 46, 47, 49, 51], "actual": [2, 4, 5, 20, 21, 22, 24, 26, 36, 55], "explicitli": [2, 8, 24, 55], "slice21": 2, "slice22": 2, "weight_multiply1": 2, "3": [2, 4, 5, 6, 8, 9, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 36, 37, 38, 40, 42, 45, 47, 49, 50, 51, 53, 54], "copi": [2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 36, 40, 42, 46, 53, 55], "branch": [2, 35, 55], "topologi": [2, 4, 10, 55], "graph": [2, 4, 5, 6, 10, 14, 17, 22, 23, 27, 28, 36, 40, 41, 42, 50, 51, 53, 55], "parser": [2, 30, 31, 32, 33, 40, 42, 55], "intern": [2, 4, 8, 24, 26, 41, 55], "handl": [2, 4, 5, 17, 30, 31, 32, 33, 41, 50, 55], "situat": [2, 5, 41, 55], "behav": 2, "abov": [2, 4, 5, 10, 19, 24, 25, 29, 30, 34, 38, 43], "whilst": 2, "simplifi": [2, 50, 55], "randomli": 2, "zeroiz": 2, "drop": [2, 45, 55], "dropout_r": [2, 42, 53], "rate": [2, 4, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 37, 38, 39, 41, 45, 50, 51, 55], "between": [2, 4, 5, 18, 30, 34, 36, 40, 41, 50, 55], "dropout1": [2, 42, 53], "unit": [2, 4, 20, 21, 22, 23, 24, 26, 27, 33, 35, 54, 55], "elu_alpha": 2, "scalar": [2, 55], "satur": 2, "fc1": [2, 4, 22, 30, 40, 41, 42, 51, 53], "elu1": 2, "rectifi": 2, "sigmoid1": 2, "NOT": [2, 24, 53], "captur": 2, "typic": [2, 4, 5, 9], "output_dim": 2, "layer1": [2, 47], "layer3": [2, 47], "arbitrari": [2, 9, 36, 55], "manner": [2, 4, 5, 8, 10, 35, 43, 55], "nx": [2, 54], "fc4": [2, 40, 53], "reducesum1": 2, "reducesum2": 2, "remain": [2, 10, 13, 17, 38, 55], "gate": 2, "recurr": 2, "batchsiz": [2, 4, 20, 21, 22, 24, 26, 27, 31, 32, 33, 40, 41, 42, 47, 51, 53], "seqlength": 2, "sequenc": [2, 4, 20, 21, 26, 55], "vector_s": 2, "gru1": 2, "conncat1": 2, "20": [2, 4, 5, 20, 21, 22, 23, 24, 26, 27, 32, 33, 40, 41, 47, 49, 51, 53, 54], "parametr": 2, "adapt": [2, 41], "adjust": [2, 5, 30, 55], "point": [2, 27], "prelu": 2, "dice": 2, "fc_din_i1": 2, "dice_1": 2, "specif": [2, 4, 5, 18, 20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 42, 44, 50, 53, 55], "item1": 2, "scale_item": 2, "sparse_embedding_good": 2, "sparse_embedding_c": 2, "fusedreshapeconcat_item_his_em": 2, "fusedreshapeconcat_item": 2, "accept": [2, 4, 14, 40, 41], "need": [2, 4, 5, 10, 13, 18, 19, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 35, 38, 40, 41, 46, 50, 51, 53, 55], "mask": [2, 26, 27, 55], "10000": [2, 4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 42], "step": [2, 4, 5, 6, 8, 10, 20, 21, 22, 23, 24, 26, 27, 31, 32, 33, 34, 35, 36, 40, 41, 50, 53, 55], "softmax_i": 2, "y": [2, 6, 32, 50], "produc": [2, 4, 22, 26, 30, 55], "scale_item1": 2, "item_his1": 2, "sub_ih": 2, "reducemean1": 2, "mutipl": 2, "m": [2, 5, 6, 9, 19, 30, 33, 40, 41, 47, 49, 50, 55], "h": [2, 19, 30, 33, 41], "matrixmutiply1": 2, "text": [2, 4, 24, 43, 44, 49, 50, 51, 52], "cdot": 2, "q": [2, 20, 21, 22, 23, 24, 28, 32, 33, 35, 51], "inner": 2, "pad": [2, 4, 47], "due": [2, 15, 22, 33, 55], "inequ": 2, "attent": [2, 55], "head": [2, 35, 42, 45, 46, 47, 49, 50, 51, 55], "seq_from": 2, "hidden_dim": 2, "seq_to": 2, "queri": [2, 5, 10, 19, 38, 41, 55], "attention_out": 2, "mark": 2, "make": [2, 4, 5, 10, 19, 20, 21, 25, 26, 27, 30, 35, 36, 38, 40, 41, 42, 43, 44, 48, 50, 51, 53, 55], "sure": [2, 5, 19, 30, 35, 36, 41, 42, 50, 53, 55], "max_sequence_len_from": 2, "max_sequence_len_to": 2, "sequence_mask": 2, "eight": [2, 54], "num_indic": 2, "gather1": 2, "predict": [2, 3, 5, 31, 32, 33, 41, 50, 51, 55], "use_regular": 2, "regulari": 2, "THe": 2, "regularizer_typ": 2, "regular": [2, 5, 30, 55], "regularizer_t": 2, "l1": 2, "l2": [2, 9], "lambda": [2, 20, 21, 22, 24, 30, 33, 50], "term": [2, 4, 55], "use_regulari": 2, "propag": [2, 4, 5, 17, 41, 55], "phase": [2, 55], "backward": [2, 4, 32, 55], "v3": [2, 55], "7": [2, 4, 10, 13, 17, 20, 21, 22, 23, 24, 26, 28, 30, 32, 33, 37, 38, 40, 41, 42, 47, 53, 54], "releas": [2, 4, 19, 24, 30, 33, 35, 41, 43, 50, 53, 54], "enabl": [2, 4, 5, 6, 10, 13, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 51, 53, 55], "placement": [2, 5, 55], "strategi": [2, 8, 19, 22, 25, 55], "compar": [2, 5, 6, 28, 41, 54, 55], "three": [2, 4, 5, 6, 18, 19, 30, 34, 35, 38, 54, 55], "advantag": [2, 5, 55, 56], "previou": [2, 5, 24, 51, 55], "enhanc": [2, 54, 55], "boost": [2, 36, 55], "flexibl": [2, 18, 55], "lookup": [2, 6, 9, 10, 12, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 36, 38, 55], "parallel": [2, 4, 5, 10, 38, 40, 46, 55, 56], "object": [2, 4, 5, 20, 21, 22, 24, 30, 33, 41, 42, 50, 55], "max_vocabulary_s": [2, 20, 22, 24, 26, 27, 32, 33, 40], "ev_siz": [2, 40], "config": [2, 8, 19, 23, 24, 26, 27, 30, 31, 32, 33, 35, 40, 41, 53, 55], "organ": [2, 4], "nccl_launch_mod": 2, "group": [2, 4, 5, 30, 35, 50, 55], "potenti": [2, 44, 55], "hang": [2, 55], "mix": [2, 4, 5, 24, 31, 40, 41, 42, 51, 53, 55, 56], "precis": [2, 4, 5, 24, 31, 40, 41, 42, 51, 53, 55], "attribut": [2, 15, 41], "dump": [2, 4, 23, 26, 27, 28, 31, 36, 41, 42, 46, 47, 48, 51, 53, 55], "contain": [2, 4, 5, 6, 8, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 36, 41, 43, 44, 45, 46, 47, 48, 50, 53, 54, 55], "incorrectli": [2, 55], "receiv": [2, 5, 10, 22, 26], "error": [2, 4, 5, 24, 30, 31, 33, 35, 41, 46, 47, 55], "know": [2, 5, 19, 55], "opt_param": [2, 4], "greater": [2, 4, 5, 19, 55], "sgd": [2, 4, 40, 53, 55], "adagrad": [2, 4, 55], "momentumsgd": [2, 4], "nesterov": [2, 4, 55], "rmsprop": 2, "adam": [2, 4, 20, 21, 22, 24, 27, 31, 32, 33, 41, 42, 51, 54, 55], "ftrl": [2, 4, 55], "203931": [2, 40], "18598": [2, 40], "14092": [2, 40], "7012": [2, 40], "18977": [2, 40], "6385": [2, 40], "1245": [2, 40], "186213": [2, 40], "71328": [2, 40], "67288": [2, 40], "11": [2, 6, 23, 24, 28, 30, 31, 32, 33, 40, 41, 42, 47, 48, 51, 53], "2168": [2, 40], "7338": [2, 40], "61": [2, 23, 40, 42, 47], "932": [2, 31, 40], "15": [2, 5, 8, 23, 30, 32, 33, 40, 41, 42, 47, 51, 53, 55], "204515": [2, 40], "141526": [2, 40], "199433": [2, 40], "60919": [2, 40], "9137": [2, 40], "71": [2, 23, 26, 40, 47], "34": [2, 23, 32, 33, 40, 41, 42, 47, 51, 53], "embedding_table_list": [2, 40], "append": [2, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 46, 47], "table_": 2, "use_exclusive_kei": [2, 40], "bool": [2, 5], "comm_strategi": [2, 55], "communicationstrategi": 2, "table_config": [2, 40], "major": [2, 4, 9, 38, 55], "arg": [2, 9, 20, 21, 22, 24, 26, 27, 30, 32, 33, 35, 40, 41, 42, 46], "abl": [2, 5, 19, 36, 55], "address": [2, 4, 5, 25, 29, 31, 34, 41, 43, 55], "challeng": [2, 10, 55], "we": [2, 4, 5, 6, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 38, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 53, 54, 55], "etp": 2, "significantli": [2, 5, 30, 31, 32, 33, 55], "influenc": 2, "shard_matrix": [2, 40, 55], "num_gpu": [2, 23, 24, 28, 40, 42], "row": [2, 4, 9, 49, 50, 51], "place": [2, 24, 38, 40, 42, 55], "th": [2, 4], "shard_strategi": [2, 40], "mp": [2, 36, 40, 41, 56], "dp": [2, 40, 56], "t0": 2, "t1": 2, "t2": 2, "t3": 2, "And": [2, 4, 53, 55], "embedding_table_nam": [2, 5, 8, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "good": [2, 5, 41], "userid": [2, 45, 50, 51], "ebc_config": [2, 40], "num_tabl": [2, 23, 24, 28, 31, 32, 55], "sparse_embed": [2, 4], "interfac": [3, 35, 36, 38, 41, 55], "level": [3, 18, 50, 55], "createsolv": [3, 31, 40, 41, 42, 51, 53, 55], "asyncparam": [3, 55], "hybridembeddingparam": [3, 55], "datareaderparam": [3, 31, 40, 41, 42, 51, 53, 55], "createoptim": [3, 31, 40, 41, 42, 51, 53], "layer": [3, 5, 6, 7, 8, 10, 12, 13, 17, 18, 23, 25, 28, 30, 31, 32, 34, 36, 38, 40, 41, 42, 47, 48, 50, 53, 54, 55, 56], "compil": [3, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 30, 31, 33, 35, 38, 40, 41, 42, 51, 53, 55], "fit": [3, 10, 31, 36, 40, 41, 42, 50, 51, 53, 55, 56], "summari": [3, 20, 21, 22, 23, 24, 26, 27, 30, 31, 33, 40, 41, 42, 51, 53], "graph_to_json": [3, 31, 41, 42, 51, 53, 55], "construct_from_json": 3, "load_dense_weight": 3, "load_dense_optimizer_st": 3, "load_sparse_weight": [3, 51], "load_sparse_optimizer_st": 3, "freeze_dens": 3, "freeze_embed": [3, 51, 55], "unfreeze_dens": 3, "unfreeze_embed": [3, 55], "reset_learning_rate_schedul": 3, "set_sourc": 3, "low": [3, 5, 10, 13, 17, 18, 20, 21, 22, 24, 26, 27, 28, 32, 33, 36], "learningrateschedul": 3, "get_next": 3, "dataread": [3, 31, 40, 41, 42, 51, 53, 55], "is_eof": 3, "get_learning_rate_schedul": 3, "get_data_reader_train": 3, "get_data_reader_ev": 3, "start_data_read": 3, "set_learning_r": 3, "get_current_loss": 3, "eval": [3, 31, 40, 41, 42, 47, 51, 53, 55], "get_eval_metr": 3, "check_out_tensor": [3, 41, 55], "infer": [3, 6, 8, 10, 13, 17, 18, 19, 25, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 43, 51, 55, 56], "inferenceparam": [3, 5, 41, 55], "inferencemodel": [3, 5, 20, 21, 23, 24, 26, 55], "datageneratorparam": [3, 31, 38, 41, 55], "datagener": [3, 31, 38, 41, 55], "datasourceparam": [3, 53, 55], "input": [3, 4, 5, 6, 9, 14, 19, 20, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33, 36, 38, 40, 41, 42, 44, 45, 47, 48, 50, 51, 53, 55], "embed": [3, 4, 6, 9, 10, 12, 13, 15, 17, 18, 20, 21, 23, 24, 25, 28, 29, 31, 32, 33, 34, 36, 37, 38, 42, 44, 49, 50, 52, 53, 55, 56], "distributedslotsparseembeddinghash": [3, 4, 31, 41, 42, 51, 53], "dens": [3, 4, 5, 6, 9, 10, 17, 20, 21, 22, 23, 24, 26, 27, 30, 31, 32, 33, 36, 38, 40, 41, 42, 51, 53, 55], "fullyconnect": [3, 55], "mlp": [3, 6, 26, 27, 31, 32, 33, 55], "multicross": [3, 53, 55], "fmorder2": [3, 55], "weightmultipli": 3, "elementwisemultipli": 3, "batchnorm": 3, "layernorm": 3, "concat": [3, 20, 21, 22, 23, 24, 30, 32, 33, 40, 41, 42, 51, 53, 55], "reshap": [3, 20, 21, 22, 23, 24, 26, 27, 32, 33, 41, 42, 51, 53, 55], "select": [3, 19, 55], "dropout": [3, 42, 53, 54, 55], "elu": [3, 55], "relu": [3, 22, 26, 27, 31, 32, 33, 40, 41, 42, 47, 51, 53, 54, 55], "sigmoid": [3, 22, 26, 27, 31, 32, 33, 41, 55], "interact": [3, 10, 13, 17, 19, 25, 26, 27, 29, 31, 32, 33, 34, 36, 38, 40, 43, 53, 54, 55], "reducesum": [3, 42, 55], "gru": [3, 55], "preludic": [3, 55], "scale": [3, 36, 37, 38, 50, 55], "fusedreshapeconcat": [3, 55], "fusedreshapeconcatgener": [3, 55], "softmax": [3, 22, 26, 55], "reducemean": [3, 55], "matrixmutipli": 3, "multiheadattent": [3, 55], "sequencemask": [3, 55], "gather": [3, 32, 33, 46, 55], "binarycrossentropyloss": [3, 31, 40, 41, 42, 51, 53], "crossentropyloss": [3, 55], "multicrossentropyloss": [3, 55], "overview": [3, 4, 5, 40], "us": [3, 4, 5, 6, 8, 9, 14, 15, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 34, 35, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56], "known": 3, "embeddingtableconfig": [3, 40], "embeddingcollectionconfig": [3, 40, 55], "embedding_lookup": [3, 6, 9, 20, 21, 23, 24, 30, 33, 40], "shard": [3, 22, 40, 55, 56], "As": [4, 5, 20, 21, 24, 26, 27, 36, 51, 55], "domain": [4, 44, 45], "framework": [4, 10, 13, 17, 18, 20, 24, 28, 34, 35, 36, 37, 38, 39, 41, 54, 55, 56], "focu": 4, "algorithm": [4, 5, 22, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "job": [4, 20, 21, 22, 23, 24, 26, 33, 41, 55], "automat": [4, 5, 10, 24, 50, 55], "deploi": [4, 5, 6, 8, 9, 10, 13, 17, 18, 19, 20, 21, 22, 25, 26, 37, 42, 43, 55], "hardwar": [4, 5, 30, 33, 55], "complet": [4, 24, 30, 31, 32, 33, 41, 46, 55], "without": [4, 5, 18, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 53, 55], "manual": [4, 20, 21, 23, 24, 26, 55], "been": [4, 20, 24, 31, 32, 33, 41, 54, 55], "wrap": [4, 22, 27, 36, 43, 56], "meanwhil": [4, 36], "maintain": [4, 5, 10, 35, 55], "who": [4, 55], "control": [4, 5, 19, 24, 30, 31, 32, 33, 55], "friendli": 4, "alreadi": [4, 5, 31, 40, 42, 43, 49, 50, 55], "deep": [4, 10, 18, 20, 21, 22, 23, 24, 26, 30, 35, 36, 37, 38, 50, 51, 54, 55, 56], "learn": [4, 10, 18, 37, 38, 50, 54, 55, 56], "like": [4, 5, 10, 19, 53, 55, 56], "kera": [4, 20, 21, 22, 23, 24, 26, 27, 30, 33, 55], "worthwhil": 4, "switch": [4, 41, 55], "notebook": [4, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 36, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55], "workflow": [4, 6, 36, 42, 50, 51, 55], "lot": [4, 30, 55], "core": [4, 6, 20, 21, 22, 23, 24, 26, 30, 33, 34, 41, 42, 54, 55], "structur": [4, 5, 10, 31, 40, 41, 42, 53, 55], "epoch": [4, 31, 40, 41, 42, 51, 53, 55], "simpli": [4, 30, 35, 41, 54, 55], "moreov": 4, "give": [4, 30, 50, 55], "save": [4, 10, 22, 23, 24, 27, 30, 31, 32, 33, 36, 41, 42, 45, 50, 53, 55], "statu": [4, 8, 24, 30, 31, 32, 33, 41, 42, 48], "etc": [4, 19, 37, 40, 55], "return": [4, 5, 8, 9, 12, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 47, 50, 55], "custom": [4, 10, 13, 17, 24, 30, 31, 32, 33, 35, 53, 55], "model_nam": [4, 5, 6, 9, 12, 15, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "empti": [4, 5, 9, 20, 21, 24, 26, 33, 41, 55], "seed": [4, 26, 31, 40, 41, 42, 51, 53], "lr_polici": 4, "polici": [4, 5], "suppot": 4, "fix": [4, 5, 35, 55], "lrpolicy_t": 4, "lr": [4, 31, 32, 40, 41, 42, 51, 53], "schedul": [4, 5, 42, 55], "001": [4, 31, 40, 41, 42, 53], "warmup_step": [4, 31, 36, 40, 41, 42, 51, 53], "warmup": [4, 19, 31, 40, 41, 42, 51, 53], "within": [4, 5, 10, 13, 23, 38, 43, 47, 48, 54, 55], "decay_start": [4, 31, 36, 40, 41, 42, 51, 53], "decai": [4, 36], "decay_step": [4, 31, 36, 40, 41, 42, 51, 53], "decay_pow": [4, 31, 40, 41, 42, 51, 53], "power": [4, 5, 19, 31, 38, 41, 55], "end_lr": [4, 31, 40, 41, 42, 51, 53], "max_eval_batch": [4, 31, 40, 41, 42, 51, 53, 55], "equal": [4, 5, 19, 21, 23, 27, 28, 41, 55], "bigger": [4, 50], "bathc": 4, "100": [4, 5, 19, 23, 27, 28, 30, 40, 47, 48, 51, 53], "batchsize_ev": [4, 31, 40, 41, 42, 51, 53, 55], "minibatch": 4, "2048": [4, 6, 30, 47, 49, 51], "here": [4, 19, 20, 21, 22, 23, 24, 25, 26, 29, 30, 34, 35, 36, 38, 40, 41, 43, 53, 54], "worker": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 51, 53, 55], "vvgpu": [4, 31, 40, 41, 42, 51, 53], "physic": 4, "numa": [4, 31, 40, 41, 42, 51, 53, 55], "possibl": [4, 18, 36, 41, 55], "repeat_dataset": [4, 31, 40, 41, 42, 51, 53], "repeat": [4, 19, 47], "otherwis": [4, 5, 24, 42, 55], "use_mixed_precis": [4, 5, 31, 51, 53], "enable_tf32_comput": 4, "acceler": [4, 6, 17, 30, 33, 36, 37, 38, 39, 50, 55, 56], "fullyconnectedlay": [4, 36], "interactionlay": [4, 36, 55], "scaler": [4, 5, 31, 40, 41, 42, 51, 53], "metrics_spec": [4, 40], "metric": [4, 6, 19, 20, 21, 24, 26, 30, 34, 55], "auc": [4, 31, 41, 42, 51, 53, 55], "averageloss": [4, 40], "hitrat": [4, 55], "threshold": [4, 5, 20, 21, 22, 23, 24, 26, 31, 32, 33, 41, 55], "metricstyp": [4, 40], "8025": 4, "termin": [4, 35], "reach": [4, 19], "i64_input_kei": [4, 5, 23, 28, 30, 31, 33, 40, 41, 42, 51, 53], "choos": [4, 40, 53], "nvtabular": [4, 38, 43, 44, 45, 51, 52, 55], "use_algorithm_search": [4, 5], "search": [4, 5, 30, 31, 32, 33, 55], "cublasgemmex": [4, 5], "use_cuda_graph": [4, 5, 31, 41, 53, 55], "cuda": [4, 5, 24, 28, 30, 31, 32, 33, 40, 41, 42, 43, 47, 48, 51, 53, 55], "asyncdataread": 4, "hybridembed": 4, "task": [4, 5, 10, 19, 20, 21, 22, 23, 24, 25, 26, 28, 33, 35, 36, 41, 43, 44, 46, 55], "pack": [4, 5, 20, 21, 22, 23, 24, 28, 32, 33, 51, 55], "device_layout": 4, "longer": [4, 50, 55], "train_intra_iteration_overlap": [4, 55], "detect": [4, 30, 31, 32, 33], "toplogi": [4, 55], "tri": [4, 5], "train_inter_iteration_overlap": [4, 55], "fetch": [4, 46, 55], "next": [4, 30, 32, 46, 47, 50, 51, 55], "earlier": 4, "eval_intra_iteration_overlap": [4, 55], "knob": [4, 55], "similar": [4, 30, 31, 32, 33, 50, 55], "eval_inter_iteration_overlap": [4, 55], "all_reduce_algo": [4, 55], "allreducealgo": [4, 55], "oneshot": 4, "multi": [4, 5, 21, 34, 35, 38, 42, 43, 45, 46, 50, 53, 54, 55], "requir": [4, 5, 6, 10, 15, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 40, 41, 42, 43, 49, 50, 51, 53, 55], "run": [4, 5, 8, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 41, 42, 47, 48, 53, 54, 55], "grouped_all_reduc": 4, "gradient": [4, 20, 21, 22, 24, 26, 27, 33, 55], "effect": [4, 24, 44, 46, 55], "small": [4, 5, 6, 38, 40, 41, 46, 55], "higher": [4, 5, 24, 46, 55], "hybrid": [4, 6, 27, 55], "num_iterations_statist": 4, "statist": [4, 5, 50], "300": [4, 22, 40, 47, 51, 53], "16384": [4, 6, 8, 30, 41, 54], "read": [4, 5, 30, 31, 32, 33, 38, 41, 46, 47, 50, 53, 54, 55], "done": [4, 26, 30, 31, 40, 41, 42, 50, 51, 53], "async_param": 4, "linux": [4, 24, 31, 41], "aio": 4, "peak": [4, 30, 31, 32, 33], "throughput": [4, 5, 19, 30, 36, 55], "num_thread": [4, 5, 55], "least": [4, 5, 9, 24, 28, 55], "num_batches_per_thread": 4, "work": [4, 8, 14, 18, 20, 21, 22, 26, 30, 35, 41, 50, 55], "simultan": [4, 36, 56], "max_num_requests_per_thread": 4, "io": [4, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 42, 43, 50, 53, 55], "request": [4, 5, 6, 19, 24, 30, 31, 32, 33, 35, 41, 50, 55], "72": [4, 23, 33, 34, 47], "most": [4, 5, 13, 19, 30, 33, 41, 55], "multi_hot_read": 4, "io_depth": 4, "queue": [4, 5, 6, 30, 55], "io_align": [4, 55], "byte": [4, 5, 10, 28, 30, 31, 32, 33, 41, 47, 50], "align": [4, 28, 55], "4096": [4, 6, 30, 31, 32, 33, 34, 41], "shuffl": [4, 32, 42, 50], "fed": [4, 30, 38], "aligned_typ": 4, "alignment_t": 4, "auto": [4, 24, 31, 32, 33, 41], "chosen": [4, 5], "obtain": [4, 10, 13, 20, 21, 22, 23, 24, 26, 27, 28, 30, 38, 40, 42, 50, 53], "unsign": 4, "is_dense_float": 4, "except": [4, 20, 21, 22, 23, 24, 26, 27, 28, 40, 41, 42, 46, 47, 53, 55], "thrown": 4, "param": [4, 20, 21, 22, 23, 24, 26, 30, 33], "16": [4, 5, 8, 9, 10, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 40, 41, 42, 47, 50, 51, 53, 54, 55], "overcom": [4, 55], "constraint": [4, 5, 30, 55], "impos": [4, 30, 55], "part": [4, 5, 19, 30, 37, 45, 55], "traffic": [4, 55], "over": [4, 5, 19, 35, 50, 54, 55], "improv": [4, 5, 22, 36, 44, 55], "deploy": [4, 5, 6, 10, 18, 20, 21, 24, 26, 30, 34, 35, 36, 55], "convers": [4, 30, 33, 41, 42, 55], "encod": [4, 51], "hybrid_embedding_param": 4, "max_num_frequent_categori": 4, "frequent": [4, 5, 50, 55], "categori": [4, 5, 30, 36, 50, 51, 55], "max_num_infrequent_sampl": 4, "infrequ": [4, 55], "p_dup_max": 4, "probabl": [4, 19, 38], "appear": [4, 19, 30, 38, 55], "onc": [4, 8, 33, 35, 41, 50, 55], "wai": [4, 10, 13, 17, 19, 25, 29, 30, 34, 38, 40, 43, 50, 54, 55], "determin": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "nvlink": [4, 34], "max_all_reduce_bandwidth": 4, "max_all_to_all_bandwidth": [4, 55], "efficiency_bandwidth_ratio": 4, "communication_typ": [4, 55], "being": [4, 19, 46, 55], "communicationtyp": [4, 55], "ib_nvlink": [4, 55], "ib_nvlink_hi": [4, 55], "nvlink_singlenod": 4, "protocol": [4, 42, 46, 47, 48, 55], "infiniband": [4, 5], "roce": [4, 55], "special": [4, 36], "gid": [4, 55], "hugectr_roce_gid": [4, 55], "hugectr_roce_tc": [4, 55], "hybrid_embedding_typ": 4, "hybridembeddingtyp": 4, "now": [4, 22, 30, 31, 32, 33, 42, 46, 49, 50, 55], "01": [4, 19, 24, 26, 27, 30, 31, 32, 33, 40, 41, 44, 47, 51, 53, 55], "3e11": 4, "9e11": 4, "warn": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "data_reader_typ": [4, 31, 40, 41, 42, 51, 53], "datareadertype_t": [4, 31, 40, 41, 42, 51, 53, 55], "file_list": [4, 31, 38, 41, 53], "txt": [4, 31, 38, 40, 41, 42, 51, 53, 55], "train_data": 4, "bin": [4, 19, 41, 49], "keyset": [4, 55], "show": [4, 5, 8, 18, 19, 20, 24, 25, 26, 33, 40, 41, 46, 54, 55], "eval_sourc": [4, 31, 40, 41, 42, 51, 53], "check_typ": [4, 31, 40, 41, 42, 51, 53], "mechan": [4, 5, 38, 41, 42, 55], "check_t": [4, 31, 40, 41, 42, 51, 53], "checksum": [4, 53], "cache_eval_data": 4, "num_sampl": [4, 20, 21, 22, 24, 26, 27, 32, 33, 55], "eval_num_sampl": 4, "float_label_dens": 4, "interpret": [4, 55], "log": [4, 25, 29, 30, 31, 32, 33, 34, 35, 38, 41, 42, 43, 54, 55], "f": [4, 19, 20, 21, 22, 23, 24, 28, 30, 32, 33, 35, 41, 42, 46, 47, 48, 49, 51], "num_work": [4, 32, 55], "concurr": [4, 5, 19, 30, 55], "empir": 4, "data_source_param": [4, 53, 55], "hdf": [4, 5, 35, 43, 55], "aw": [4, 5, 35, 43, 55], "s3": [4, 5, 35, 43, 55], "googl": [4, 55], "cloud": [4, 13, 17, 25, 29, 34, 43, 55], "async": [4, 41, 55], "fig": [4, 10, 17, 18, 31, 32, 33, 36, 38, 54], "minimum": [4, 6, 25, 29, 30, 34, 43, 55], "granular": [4, 55], "header": [4, 24, 38, 41, 42, 55], "tabular": [4, 44, 50], "alwai": [4, 9, 55], "constant": [4, 30, 32, 33, 41], "payment": 4, "preced": [4, 18, 55], "yellow": 4, "box": [4, 50], "depict": 4, "reserv": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "signific": [4, 5, 22, 41], "exclud": 4, "charg": [4, 41], "definit": [4, 41], "typedef": 4, "struct": [4, 20, 21, 22, 23, 24, 26, 27, 28, 32, 33, 51, 55], "datasetheader_": 4, "error_check": 4, "check_num": 4, "number_of_record": 4, "datasethead": 4, "data_": 4, "check_sum": 4, "char": [4, 15, 41], "checkbit": 4, "slot_": 4, "changeabl": 4, "45": [4, 23, 30, 32, 33, 40, 41, 42, 47, 51, 53, 54], "67": [4, 23, 47], "undefin": [4, 31, 55], "behavior": [4, 5, 30, 41, 55], "given": [4, 9, 45], "assign": [4, 5, 24, 30, 31, 32, 33, 35, 41, 51, 55], "line": [4, 30, 33, 40, 41, 42, 43, 55], "path": [4, 5, 19, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 40, 42, 45, 46, 47, 50, 51, 53, 55], "cat": [4, 28, 42, 50, 53], "simple_sparse_embedding_file_list": 4, "simple_sparse_embed": 4, "simple_sparse_embedding0": 4, "simple_sparse_embedding1": 4, "simple_sparse_embedding2": 4, "simple_sparse_embedding3": 4, "simple_sparse_embedding4": 4, "simple_sparse_embedding5": 4, "simple_sparse_embedding6": 4, "simple_sparse_embedding7": 4, "simple_sparse_embedding8": 4, "simple_sparse_embedding9": 4, "wdl_norm": 4, "file_list_test": [4, 31, 38, 41, 53], "aspect": 4, "datatyp": [4, 24, 31, 32, 33, 41], "outperform": 4, "disk": [4, 30, 45, 50, 55], "feed": [4, 33, 38, 41, 50], "go": [4, 35, 40, 41, 42, 43, 50], "incorpor": [4, 13], "3g": [4, 55], "wdl_raw": 4, "validation_data": 4, "column": [4, 41, 42, 45, 49, 50, 51, 55], "orient": 4, "open": [4, 5, 10, 13, 17, 20, 21, 22, 23, 24, 28, 30, 31, 32, 33, 36, 38, 39, 41, 46, 47, 48, 49, 51, 55], "free": [4, 41, 42, 55], "apach": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "hadoop": [4, 35, 36, 43, 53, 55], "ecosystem": 4, "compress": [4, 38], "nest": [4, 55], "loader": [4, 23, 24, 28, 30, 31, 32, 33, 41], "miss": [4, 5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 47, 51, 55], "int64": [4, 5, 9, 10, 12, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 41, 42, 49, 50, 55], "arrang": 4, "numer": [4, 5, 38, 44], "separ": [4, 5, 10, 20, 21, 24, 26, 27, 31, 41, 50, 55], "_metadata": [4, 50, 53, 55], "file_stat": [4, 53], "file_nam": [4, 53], "file0": 4, "num_row": [4, 53], "409600": 4, "file1": 4, "col_nam": [4, 53], "c1": [4, 53], "c2": [4, 53], "c3": [4, 53], "c4": [4, 53], "cont": [4, 42, 53], "i1": 4, "i2": 4, "i3": 4, "parquet_data": 4, "_file_list": [4, 40, 42, 51], "val": [4, 31, 40, 41, 42, 53], "50000": [4, 24], "20000": [4, 20, 21, 24, 42], "whose": [4, 24, 25, 26, 40, 55], "duplic": [4, 36, 50, 55], "ensur": [4, 5, 8, 13, 19, 23, 28, 30, 41, 50, 55], "snippet": 4, "0th": 4, "1st": [4, 21, 40], "third": [4, 18, 19, 35, 43, 55], "60000": 4, "entri": [4, 21, 22, 26, 33, 55], "resid": 4, "folder": [4, 19, 24, 26, 30, 31, 40, 41, 55], "basic": [4, 9, 10, 12, 41], "four": [4, 55], "frame": 4, "edit": [4, 35], "desir": [4, 10, 30, 41, 55], "chang": [4, 5, 19, 20, 21, 26, 30, 36, 50, 55, 56], "hyperparamet": [4, 36, 41], "well": [4, 50, 55], "meticul": 4, "update_typ": [4, 31, 40, 42, 53], "hit": [4, 5, 19, 20, 21, 22, 23, 24, 26, 31, 32, 33, 41, 50, 51, 55], "lazyglob": 4, "semant": [4, 55], "optimizer_typ": [4, 31, 40, 41, 42, 51, 53], "optimizer_t": [4, 31, 40, 41, 42, 51, 53], "update_t": [4, 31, 40, 42, 53], "beta1": [4, 31, 42], "9": [4, 5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 38, 41, 42, 47, 48, 53], "beta2": [4, 31, 42], "999": [4, 31, 42], "lambda1": 4, "lambda2": 4, "momentum_factor": 4, "atomic_upd": [4, 40, 53], "atom": [4, 41], "0000001": [4, 42], "groupdens": 4, "hugectr_layer_book": 4, "trane": 4, "reader_param": 4, "groupdenselay": [4, 55], "embeddingcollect": 4, "seri": [4, 37, 43, 44], "taken": [4, 9], "dense_lay": 4, "overload": [4, 50, 55], "flexibli": 4, "buffer": [4, 5, 26, 41, 55], "loss_nam": 4, "loss_weight": 4, "match": [4, 5, 8, 24, 30, 38], "through": [4, 5, 10, 13, 36, 37, 38, 39, 41, 45, 47, 49, 50, 55], "num_epoch": [4, 55], "max_it": [4, 31, 40, 41, 42, 51, 53, 55], "2000": [4, 19, 21, 42, 51, 53], "displai": [4, 31, 40, 41, 42, 43, 51, 53, 55], "200": [4, 24, 26, 27, 30, 31, 40, 41, 51, 53], "eval_interv": [4, 31, 40, 41, 42, 51, 53], "execut": [4, 6, 8, 10, 24, 30, 33, 35, 41, 47, 48, 51, 55], "1000": [4, 10, 19, 21, 27, 28, 31, 40, 41, 42, 47, 51, 53, 55], "invalid": 4, "remot": [4, 5, 43, 55], "gc": [4, 5, 53, 55], "localhost": [4, 5, 6, 20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 41, 55], "9000": [4, 5, 42, 53, 55], "dir": [4, 5, 19, 30, 31, 32, 33, 50], "virtual": [4, 5, 41], "style": [4, 5, 55], "region": [4, 5, 53], "offici": [4, 5, 55], "uri": [4, 5, 55], "bucket": [4, 5], "url": [4, 5, 18, 24, 35, 46, 55], "http": [4, 5, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 45, 47, 48, 49, 50, 53, 55], "googleapi": [4, 5, 40, 42, 53], "com": [4, 5, 13, 17, 19, 24, 25, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 47, 49, 50, 53, 55], "mpi": [4, 31, 40, 41, 42, 43, 51, 53, 55], "print": [4, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 46, 47, 50, 51, 55], "graph_config_fil": [4, 42, 51, 53], "fine": [4, 55], "tune": 4, "include_dense_network": 4, "whole": [4, 10, 30, 36, 56], "dense_opt_states_fil": [4, 55], "\u2170": 4, "sparse_embedding_fil": 4, "\u2171": 4, "sparse_embedding_files_map": 4, "dict": [4, 8, 20, 21, 22, 24, 26, 27, 32, 33, 41, 46], "sparse_embedding2": [4, 5, 41, 42], "358": [4, 24], "wdl_0_sparse_4000": 4, "wdl_1_sparse_4000": 4, "sparse_opt_states_fil": [4, 55], "sparse_opt_states_files_map": 4, "freez": [4, 32], "criteo": [4, 30, 38, 40, 42, 54, 55], "embedding_nam": 4, "unfreez": 4, "reset": [4, 41, 55], "base_lr": 4, "under": [4, 8, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 50, 53, 55], "On": [4, 8, 40, 55], "basi": [4, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "expos": 4, "elabor": 4, "datareader32": 4, "datareader64": 4, "re": [4, 30, 35, 38, 41, 46, 55], "form": [4, 25, 38, 41, 55], "begin": [4, 5, 28, 30, 33], "train_data_read": 4, "eval_data_read": 4, "enter": [4, 41], "loop": [4, 22, 33, 41, 50], "later": [4, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 50, 55], "emb_vector": [4, 9, 10, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 51, 53], "distributedslotembed": [4, 36], "slot_id": 4, "localizedslotembed": [4, 36], "info": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 50, 51, 53, 55], "nth": 4, "suffix": [4, 41], "latest": [4, 55], "via": [4, 5, 6, 10, 28, 30, 41, 49, 55], "numpi": [4, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 47, 48, 49, 50, 51, 55], "float32": [4, 9, 10, 12, 14, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 49, 50, 55], "float16": 4, "flow": 4, "debug": [4, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 40, 41, 42, 53, 55], "correct": [4, 30, 41, 55], "intermedi": [4, 5, 35, 55], "easili": [4, 10, 20, 28, 38, 50, 55], "tensor_nam": 4, "tensor_typ": 4, "tensor_t": [4, 41], "1280": [4, 24, 53], "75": [4, 6, 10, 13, 17, 23, 32, 33, 38, 42, 47], "concat1": [4, 26, 27, 30, 33, 41, 42, 51, 53], "sparse_embedding1_train_flow": 4, "fc1_evaluate_flow": 4, "inferencesess": [4, 41], "server": [4, 6, 19, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 35, 37, 43, 48, 53, 54, 55], "tensorflow": [4, 5, 6, 8, 17, 18, 20, 21, 22, 23, 25, 26, 27, 34, 35, 36, 37, 38, 41, 43, 55, 56], "tensorrt": [4, 5, 6, 15, 18, 24, 43, 55], "purpos": [4, 38, 43, 50, 55], "triton": [4, 5, 6, 17, 18, 25, 34, 35, 38, 55], "deriv": [4, 10], "besid": [4, 20, 22, 24, 55], "session": [4, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "model_config_path": 4, "inference_param": 4, "max_batchs": [4, 5, 41], "num_batch": [4, 55], "40000": [4, 24], "40960": [4, 31, 41, 53], "960": 4, "cardin": [4, 51], "suitabl": [4, 5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 40, 42, 45, 53, 55], "model_config": 4, "dcn_dense_1000": 4, "dcn0_sparse_1000": 4, "deployed_devic": [4, 5, 41], "use_gpu_embedding_cach": [4, 5, 41, 55], "cache_size_percentag": [4, 5, 41], "inference_model": [4, 20, 21, 26], "pred": [4, 23, 28, 32, 41], "embed_vec_s": [4, 9, 20, 22, 24, 26, 27, 30, 32, 33], "sparse_embedding1_inference_flow": 4, "acknowledg": 4, "synthet": [4, 30, 31, 41, 45, 46, 55], "num_slot": [4, 31, 41, 55], "paruqet": 4, "test_data": 4, "nnz_arrai": [4, 31, 41], "simul": [4, 55], "dist_typ": [4, 31, 41], "distribution_t": [4, 31, 41], "powerlaw": [4, 19, 31, 41], "power_law_typ": [4, 31, 41], "law": [4, 20, 21, 22, 23, 24, 26, 27, 28, 31, 38, 40, 41, 42, 53, 55], "powerlaw_t": [4, 31, 41], "alpha": [4, 19, 31, 32, 38, 41, 55], "medium": [4, 37, 55], "short": [4, 31, 37, 41, 55], "num_fil": [4, 31, 41], "eval_num_fil": [4, 31, 41], "num_samples_per_fil": [4, 31, 41], "5242880": [4, 53], "1310720": 4, "regard": [4, 5, 6, 55], "data_generator_param": [4, 31, 41], "encapsul": [4, 13, 55], "datasourc": 4, "hugect": 4, "filesystemtype_t": [4, 53], "ip": [4, 5, 25, 29, 30, 34, 43, 47, 48, 53], "cluster": [4, 5, 10, 24, 33, 36, 38, 42, 53, 55, 56], "namenod": [4, 53, 55], "endpoint": [4, 5, 53], "put": [4, 49], "Will": 4, "listen": [4, 5], "huge": 5, "further": [5, 55], "grant": 5, "abil": [5, 18, 55], "perman": 5, "demo": [5, 19, 36, 55], "offer": [5, 18, 55, 56], "superior": 5, "cpu": [5, 6, 8, 10, 18, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 34, 41, 43, 47, 48, 50, 54, 55], "counterpart": [5, 6, 55], "although": [5, 55], "modern": 5, "center": 5, "nvidia": [5, 6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 49, 50, 53, 54, 55], "increas": [5, 30, 54, 55], "ai": [5, 36], "come": [5, 55], "spearhead": 5, "vastli": [5, 55], "clsuter": 5, "ram": [5, 10], "asid": 5, "retain": [5, 55], "hdd": [5, 10], "sdd": [5, 10], "magnitud": [5, 30], "ddr": 5, "hbm": [5, 27, 55], "cost": 5, "throughout": [5, 55], "latenc": [5, 6, 10, 13, 17, 18, 19, 20, 24, 28, 30, 34, 36, 41, 55], "drr": 5, "act": 5, "therebi": 5, "respons": [5, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 42, 53], "redi": [5, 55], "retriev": [5, 9, 10, 13, 17, 20, 24, 26, 28, 36, 55], "rdb": [5, 41], "aof": [5, 41], "seamless": 5, "restart": [5, 41, 46, 47, 48], "particip": 5, "claim": 5, "guarante": [5, 33, 41, 55], "statement": [5, 13, 17, 43], "hiredi": [5, 41], "love": 5, "hear": 5, "experi": [5, 10, 19, 25, 29, 34, 43, 55], "let": [5, 41, 50, 55], "successfulli": [5, 10, 24, 25, 29, 30, 31, 32, 33, 34, 36, 41, 42, 43, 53], "unsuccessfulli": 5, "target": [5, 19, 35, 36, 41, 43, 46, 50, 51, 54, 55], "link": [5, 10, 24, 30, 38, 40, 42, 46, 49, 55], "consid": [5, 20, 21, 26, 36, 49], "compliment": 5, "expand": 5, "capabl": [5, 20, 21, 22, 23, 24, 26, 31, 33, 35, 41, 55, 56], "capac": [5, 18, 36], "entir": [5, 55], "whatev": 5, "reason": [5, 24, 43], "becom": [5, 38, 55], "unavail": [5, 55], "respond": [5, 35], "though": 5, "properti": [5, 50], "emphas": 5, "rough": 5, "guidelin": 5, "often": [5, 44], "ethernet": 5, "rel": 5, "practic": [5, 36], "gb": [5, 25, 29, 34, 40, 41, 42, 43], "few": 5, "tb": [5, 55], "mainten": 5, "stream": [5, 23, 28, 30, 33, 41, 46, 55], "extern": [5, 45, 50], "kafka": [5, 55], "downtim": 5, "retrain": [5, 30], "logic": [5, 9], "whenev": 5, "engin": [5, 6, 17, 18, 24, 34, 42, 50, 52, 55], "associ": [5, 55], "resolv": [5, 31, 40, 41, 42, 51, 53, 55], "turn": [5, 6, 23, 50, 55], "represent": 5, "fill": [5, 40, 41], "publish": [5, 41], "certain": 5, "ingest": [5, 55], "stage": [5, 19, 20, 21, 24, 26, 30, 31, 32, 33, 38, 54, 55], "suffici": [5, 55], "attempt": [5, 30, 31, 32, 33, 55], "minim": [5, 55, 56], "recent": [5, 55], "lru": 5, "volatiledatabaseparam": [5, 41], "persistentdatabaseparam": 5, "updatesourceparam": 5, "These": [5, 10, 13, 17, 26, 33, 38, 44, 55], "packag": [5, 10, 17, 22, 24, 26, 30, 32, 33, 36, 38, 46, 47, 48, 49, 50, 55, 56], "supportlonglong": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "fuse_embedding_t": [5, 23, 28, 30, 33, 55], "volatile_db": [5, 41], "persistent_db": 5, "update_sourc": 5, "At": [5, 40], "origin": [5, 26, 38, 54, 55], "synchron": [5, 19, 30, 35, 55], "plugin": [5, 6, 18, 22, 23, 25, 26, 28, 29, 35, 37, 38, 43, 55], "torch": [5, 17, 18, 29, 32, 41, 47, 48, 55], "describ": [5, 36], "speak": 5, "rare": [5, 40, 55], "might": [5, 30, 32], "sens": 5, "vari": 5, "heterogen": 5, "network_fil": [5, 19], "number_of_refresh_buffers_in_pool": 5, "thread_pool_s": [5, 28, 33], "cache_refresh_percentage_per_iter": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 55], "default_value_for_each_t": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "maxnum_des_feature_per_sampl": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "embedding_cache_typ": [5, 23, 28, 30, 55], "refresh_delai": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "refresh_interv": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "maxnum_catfeature_query_per_table_per_sampl": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "embedding_vecsize_per_t": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "divis": 5, "device_id": [5, 26, 41], "devicelist": 5, "goe": 5, "directli": [5, 20, 21, 24, 26, 27, 33, 38, 41, 47, 55], "uvm": [5, 55], "No": [5, 20, 21, 23, 24, 26, 30, 31, 32, 33, 40], "percentag": [5, 6, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "pool": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "refresh": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "increment": [5, 50, 55], "occur": [5, 31, 55], "frequenc": [5, 30, 55], "volum": 5, "std": [5, 41, 47, 55], "hardware_concurr": [5, 55], "delai": [5, 19], "wait": [5, 28, 30, 35, 41, 45], "timer": [5, 41], "servic": [5, 10, 20, 21, 22, 26, 30, 33, 55], "period": [5, 36], "partit": [5, 50, 55], "use_context_stream": [5, 23, 28, 30, 33], "context": [5, 23, 28, 30, 33, 41], "sparse_fil": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "wdl_infer": [5, 19], "wdl0_sparse_20000": 5, "wdl1_sparse_20000": 5, "dense_fil": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "wdl_dense_20000": 5, "num_of_worker_buffer_in_pool": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "num_of_refresher_buffer_in_pool": [5, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "deployed_device_list": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "max_batch_s": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "table1": [5, 23, 28], "table2": [5, 23, 28], "gpucachep": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "gpucach": [5, 8, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "back": [5, 24, 41, 55], "indvidu": 5, "collabor": 5, "inject": 5, "underli": [5, 10, 13, 17, 38, 55], "redis_clust": [5, 41], "127": [5, 26, 30, 41, 42], "7000": [5, 41, 42], "user_nam": 5, "password": 5, "num_partit": [5, 41], "allocation_r": 5, "268435456": 5, "mib": [5, 30, 31, 32, 33], "shared_memory_s": 5, "17179869184": [5, 41], "gib": [5, 42], "shared_memory_nam": 5, "hctr_mp_hash_map_databas": [5, 41], "shared_memory_auto_remov": [5, 41], "65536": [5, 6, 20, 30, 40], "enable_tl": [5, 41, 55], "tls_ca_certif": [5, 41, 55], "cacertbundl": 5, "crt": [5, 41], "tls_client_certif": [5, 41, 55], "client_cert": 5, "pem": [5, 41], "tls_client_kei": [5, 41, 55], "client_kei": 5, "tls_server_name_identif": [5, 41, 55], "overflow_margin": 5, "overflow_polici": 5, "databaseoverflowpolicy_t": 5, "enum_valu": 5, "overflow_resolution_target": 5, "initialize_after_startup": [5, 41], "initial_cache_r": 5, "cache_missed_embed": 5, "update_filt": 5, "filter": [5, 30], "7003": 5, "7004": 5, "7005": 5, "10000000": [5, 40, 42], "evict_random": 5, "hash_map": 5, "multi_process_hash_map": [5, 41, 55], "live": [5, 24], "dev": [5, 41, 42, 55], "shm": [5, 41, 55], "parallel_hash_map": 5, "degre": 5, "hashmap": [5, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "split": [5, 30, 42, 47, 55], "evenli": 5, "min": [5, 19, 21, 31, 32, 33], "number_of_cpu_cor": 5, "build": [5, 6, 17, 18, 24, 25, 29, 34, 36, 41, 47, 50, 53, 55, 56], "denot": 5, "word": [5, 9, 41], "upper": 5, "bound": 5, "latter": 5, "particularli": [5, 38], "imag": [5, 25, 29, 34, 35, 38, 43, 44, 46, 47, 49, 51, 52], "insuffici": 5, "nativ": [5, 6, 10, 18, 19, 23, 25, 30, 31, 32, 36, 41, 55], "doc": [5, 24, 30, 31, 32, 33, 41, 55], "symbol": [5, 31, 42], "attach": [5, 41], "remov": [5, 35, 40, 41, 50, 55], "disconnect": [5, 41], "program": [5, 30, 31, 32, 33, 41, 43, 55], "pattern": [5, 55], "account": [5, 50], "divid": [5, 9], "num_paritit": 5, "strictli": 5, "incur": [5, 55], "overhead": [5, 6, 22, 30, 55], "too": [5, 41, 50, 55], "5x": [5, 24, 55], "mass": 5, "chunk": [5, 35, 50, 55], "transmiss": 5, "stabil": [5, 30], "1000000": [5, 53], "conjunct": [5, 55], "262143": 5, "18": [5, 19, 23, 30, 32, 33, 41, 47, 51, 53], "lead": [5, 35, 36, 37, 55], "obscur": 5, "therefor": [5, 30, 35, 41, 55], "tl": [5, 55], "ssl": [5, 55], "secur": [5, 50], "encrypt": [5, 41, 55], "slightli": [5, 55], "filesystem": [5, 30, 55], "certif": [5, 41], "ca": [5, 41], "client": [5, 19, 24, 30, 31, 32, 33, 41, 42, 55], "privat": [5, 41], "sni": 5, "instabl": 5, "sporad": 5, "consumpt": [5, 55], "occupi": [5, 24, 30, 33, 42], "ideal": 5, "100000000": [5, 50], "reliabl": [5, 50], "condit": [5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "prune": 5, "conduct": [5, 6, 28, 29, 55], "until": [5, 19, 20, 21, 24, 26, 41, 55], "evict_least_us": 5, "lfu": 5, "effort": [5, 55], "evict_oldest": 5, "complic": [5, 41, 50, 56], "comparison": [5, 54, 55], "faster": [5, 54, 55], "deliv": [5, 55], "evict": [5, 41, 55], "doubl": [5, 9, 41], "fraction": 5, "keep": 5, "exactli": [5, 9, 55], "shrunk": 5, "80": [5, 10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 31, 32, 33, 35, 38, 41, 42, 43, 47], "surpass": 5, "content": [5, 20, 21, 22, 23, 24, 26, 27, 28, 40, 41, 42, 53, 55], "previous": [5, 55], "reconnect": 5, "rocksdb": [5, 55], "materi": [5, 50], "immedi": 5, "upon": [5, 55], "startup": [5, 30, 55], "50": [5, 20, 22, 23, 24, 30, 32, 33, 41, 42], "anoth": [5, 41, 42, 55], "written": [5, 20, 21, 24, 26, 30, 33, 43], "send": [5, 6, 24, 30, 31, 32, 33, 41, 55], "hps_": 5, "databasetype_t": [5, 41], "tmp": [5, 32, 42], "read_onli": 5, "rocks_db": 5, "datatabas": 5, "prevent": [5, 38, 41, 55], "found": [5, 9, 20, 21, 23, 24, 26, 30, 32, 33, 36, 40, 41, 43, 51, 53], "Be": 5, "awar": [5, 31], "overwrit": [5, 22, 23, 24, 26, 30, 33, 40, 51, 53], "driver": [5, 40], "nf": 5, "kept": [5, 6], "sync": 5, "kafka_message_queu": 5, "broker": [5, 55], "metadata_refresh_interval_m": 5, "30000": [5, 20, 21, 24], "poll_timeout_m": 5, "500": [5, 40, 51, 53], "receive_buffer_s": 5, "262144": 5, "8192": [5, 6, 30, 40], "failure_backoff_m": 5, "max_commit_interv": 5, "9092": 5, "null": [5, 15, 41, 55], "semicolon": 5, "delimit": 5, "pair": [5, 38, 42, 51], "topic": [5, 10, 36], "metadata": [5, 35, 45, 46, 50, 55], "download": [5, 19, 30, 35, 40, 42, 44, 46, 49, 52, 55], "send_buffer_s": 5, "kafkamessagesink": 5, "push": 5, "millisecond": [5, 55], "dispatch": [5, 22, 26], "fail": [5, 24, 42], "success": [5, 6, 8, 30, 31, 35, 41, 42, 51, 53], "temporarili": 5, "unreach": 5, "retri": 5, "commit": 5, "independ": [5, 13, 24, 30, 31, 32, 33, 55], "were": [5, 20, 21, 22, 24, 30, 33, 50, 54, 55], "sinc": [5, 23, 24, 30, 31, 32, 33, 36, 38, 40, 41, 55], "create_tf_model": 6, "py": [6, 22, 23, 24, 26, 30, 31, 32, 33, 35, 36, 38, 40, 41, 42, 50, 51, 53, 55], "savedmodel": [6, 8, 21, 25, 26, 30, 33, 55], "16gb": [6, 51, 54], "almost": [6, 20, 21, 24, 26, 54], "furthermor": 6, "create_trt_engin": 6, "summar": [6, 10, 25, 29, 30, 34, 43, 52], "onnx": [6, 17, 43, 55], "surgeri": [6, 17], "experiment": [6, 23, 27, 41, 55], "variablepolici": 6, "save_variable_devic": 6, "common": [6, 24, 26, 27, 36, 53, 54, 56], "baselin": 6, "nn": [6, 9, 10, 12, 20, 21, 22, 24, 28, 30, 32, 33, 47], "lookuplay": [6, 7, 8, 11, 22, 23, 26, 28], "unchang": 6, "integr": [6, 10, 17, 18, 20, 34, 37, 55], "built": [6, 18, 20, 21, 24, 26, 30, 34, 35, 36, 47, 55], "optimum": 6, "131072": 6, "investig": [6, 41], "sxm4": [6, 34], "80gb": [6, 34, 36], "trt": [6, 15, 25, 30, 31, 32, 33, 43, 55], "hps_tensorflow_triton_deployment_demo": [6, 25], "demo_for_tf_trained_model": [6, 34], "repeatedli": [6, 22, 33, 41], "analyz": [6, 30, 55], "serv": [6, 18, 30, 33, 36, 55], "studi": [6, 55], "measur": [6, 30, 50, 55], "perf_analyz": [6, 19, 30], "8000": [6, 24, 30, 31, 32, 33, 42], "categorical_featur": [6, 30, 31, 32, 33], "numerical_featur": [6, 30, 31, 32, 33], "276633": 6, "7912898": 6, "7946796": 6, "7963854": 6, "7971191": 6, "7991237": 6, "7991368": 6, "7998351": 6, "7999728": 6, "8014930": 6, "13554004": 6, "14136456": 6, "14382203": 6, "14382219": 6, "14384425": 6, "14395091": 6, "14395194": 6, "14395215": 6, "14396165": 6, "14671338": 6, "22562171": 6, "25307802": 6, "32394527": 6, "32697105": 6, "32709007": 6, "32709104": 6, "76171875": 6, "806640625": 6, "609375": 6, "04296875": 6, "7919921875": 6, "0986328125": 6, "9453125": [6, 33], "38671875": 6, "3984375": 6, "9462890625": 6, "side": [6, 19, 24, 30, 55], "report": [6, 24, 30, 55], "count": [6, 24, 26, 27, 30, 31, 32, 33, 46], "28589": 6, "avg": [6, 30], "562": [6, 41, 47], "usec": [6, 30, 34], "59": [6, 20, 23, 33, 40, 47, 51, 53, 55], "431": [6, 41], "53": [6, 19, 23, 26, 40, 47, 51, 53], "merlin": [6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 41, 42, 43, 50, 53, 55], "nvcr": [6, 10, 13, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 43, 55], "02": [6, 10, 17, 25, 30, 33, 34, 41, 44, 45, 47, 51, 53], "amd": [6, 34], "epyc": [6, 34], "7742": [6, 34], "processor": [6, 34], "softwar": [6, 10, 13, 17, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 42, 46, 53, 55], "22": [6, 23, 24, 30, 32, 33, 47, 51, 53, 55], "cuda11": 6, "microsecond": 6, "figur": [6, 18], "logarithm": 6, "10x": 6, "speedup": [6, 54, 55], "551": [6, 28, 30, 40], "612": 6, "380": [6, 28, 30, 40, 42], "389": 6, "42": [6, 22, 23, 30, 31, 32, 33, 40, 41, 42, 45, 47, 50, 51], "608": [6, 40, 47, 53], "667": [6, 41, 53], "381": [6, 40], "346": [6, 47], "76": [6, 23, 30, 53], "832": 6, "639": 6, "438": [6, 47], "428": [6, 47], "94": [6, 23, 47], "1911": 6, "849": 6, "604": [6, 47], "534": [6, 40], "58": [6, 23, 30, 33, 42, 47, 51, 53], "4580": 6, "1059": 6, "927": [6, 30, 40], "766": 6, "98": [6, 23, 47, 50], "9872": 6, "1459": 6, "1446": 6, "1114": 6, "86": [6, 23, 24, 26, 40, 41, 47], "19643": 6, "2490": 6, "2432": 6, "1767": 6, "35292": 6, "4131": 6, "4355": 6, "3053": 6, "56": [6, 20, 23, 24, 26, 30, 31, 33, 34, 40, 42, 47, 51, 53], "32768": [6, 30], "54090": 6, "7795": 6, "6816": 6, "5247": 6, "31": [6, 23, 31, 32, 33, 40, 41, 42, 47, 51, 53], "107742": 6, "15036": 6, "13012": 6, "10022": 6, "213990": 6, "29374": 6, "25440": 6, "19340": 6, "06": [6, 13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 38, 40, 41, 42, 43, 44, 47, 51, 53], "init": [7, 8, 10, 19, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 40, 41, 42, 43, 51, 53, 55], "sparselookuplay": [7, 8, 10, 22], "hierarchical_parameter_serv": [8, 9, 10, 20, 21, 22, 23, 24, 26, 27, 28, 55], "kwarg": [8, 9, 20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "abbrevi": [8, 9], "implicitli": [8, 24, 41, 55], "ps_config_fil": [8, 9, 12, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 55], "global_batch_s": [8, 9, 20, 21, 22, 23, 24, 26, 27, 32, 33, 55], "constructor": [8, 9, 24], "safe": [8, 32, 41], "implicit": [8, 9, 24, 25], "especi": [8, 55], "cuda_visible_devic": [8, 20, 21, 22, 23, 24, 26, 28, 32, 33, 42, 55], "set_visible_devic": [8, 27, 55], "addition": [8, 44, 55], "visibl": [8, 55], "horovod": [8, 27, 55], "scope": [8, 22, 32, 55], "hvd": [8, 27], "sess": [8, 41], "hps_init": 8, "keyword": 8, "dictionari": [8, 50], "demo_model": [8, 15], "demo_model_spars": 8, "sparse_embedding0": [8, 21, 22, 26, 31, 32, 33], "demo_model2": 8, "demo_model2_sparse_0": 8, "demo_model2_sparse_1": 8, "ok": [8, 41, 48], "wrapper": [9, 12, 24], "embedding_lookup_spars": [9, 10, 21, 22], "table_id": [9, 12, 15, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40], "emb_vec_s": [9, 12, 15, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33], "emb_vec_dtyp": [9, 20, 21, 22, 23, 24, 26], "sparse_lookup_lay": [9, 21, 22, 26], "def": [9, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 40, 41, 46, 47, 51], "_infer_step": [9, 20, 21, 26], "embedding_vector": [9, 20, 24, 26, 27, 30, 32, 33, 51], "sp_id": [9, 21, 22, 26], "sp_weight": [9, 21, 22, 26], "enumer": [9, 20, 21, 22, 24, 26, 27, 28, 33, 40, 41, 46, 47, 51], "max_norm": [9, 55], "op": [9, 24, 30, 31, 32, 33, 42, 50, 51, 55], "canon": 9, "sparsetensor": [9, 21, 22, 26], "aggreg": 9, "int32": [9, 12, 14, 15, 23, 28, 30, 31, 32, 33], "sqrtn": 9, "squar": 9, "root": [9, 19, 25, 29, 30, 34, 35, 42, 43, 47, 48, 53, 55], "clip": [9, 42, 55], "d0": 9, "d1": 9, "self": [9, 10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 38, 41, 43], "3x16": 9, "vector_for_id_1": 9, "vector_for_id_3": 9, "vector_for_id_0": 9, "rais": [9, 27, 40, 41], "typeerror": 9, "neither": 9, "nor": 9, "valueerror": [9, 27], "lookup_lay": [9, 20, 21, 23, 24], "Its": [9, 55], "get_shap": 9, "realiz": [10, 17, 20, 28, 36], "toolkit": [10, 13, 17, 20, 38], "face": 10, "hundr": 10, "gigabyt": 10, "qualiti": 10, "engag": 10, "dozen": 10, "mitig": 10, "volatil": [10, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 55], "tail": [10, 42, 51, 55], "characterist": [10, 30], "hierarchi": 10, "ssd": [10, 18, 55], "subscrib": [10, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "illustr": [10, 36, 55], "sok": [10, 25, 36, 37, 55, 56], "distributedembed": [10, 26], "dissect": 10, "subgraph": 10, "composid": 10, "saver": [10, 26], "dump_to_fil": [10, 26, 27], "sm": [10, 13, 17, 35, 38], "volta": [10, 13, 17, 36, 38], "70": [10, 13, 17, 19, 23, 32, 35, 38, 40, 43, 47, 53], "ture": [10, 13, 17, 36, 38], "amper": [10, 13, 17, 36, 38, 55], "h100": [10, 13, 17, 34, 35, 38], "hopper": [10, 13, 17, 30, 38, 55], "90": [10, 13, 17, 19, 23, 24, 35, 38, 47, 55], "compon": [10, 13, 17, 19, 35, 38, 55], "applic": [10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 40, 41, 42, 46, 47, 48, 53, 55], "portabl": [10, 13, 17, 30, 38], "reproduc": [10, 13, 17, 25, 29, 33, 34, 38, 43], "agnost": [10, 17, 38], "ll": [10, 35, 38, 40, 50, 55], "pull": [10, 13, 17, 19, 35, 38, 48], "rm": [10, 13, 17, 19, 25, 29, 30, 34, 35, 38, 41, 43, 47, 48, 55], "cap": [10, 13, 17, 19, 25, 29, 34, 38, 40, 43], "sys_nic": [10, 13, 17, 19, 25, 29, 34, 38, 43], "python3": [10, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38, 40, 41, 49], "jupyt": [10, 13, 17, 24, 30, 31, 32, 33, 47, 48, 55], "cover": [10, 30, 41, 46], "migrat": [10, 55], "hps_dlrm_benchmark": [10, 17], "md": [10, 17, 55], "inherit": 12, "modul": [12, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33, 35, 41, 42, 43, 47, 55], "hps_torch": [12, 13, 28, 29], "__init__": [12, 20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33], "har": 13, "seamlessli": [13, 55], "catalog": [13, 17, 38], "explor": 13, "visit": [13, 55], "24": [13, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 30, 31, 32, 33, 38, 40, 41, 42, 43, 47, 51, 53, 54], "hpsplugin": [14, 16], "registr": [14, 15], "hps_trt": [14, 15, 17, 30, 31, 32, 33, 34], "num_keys_per_sampl": 14, "embedding_vector_s": 14, "hpsplugincr": [14, 15, 16], "registri": 14, "trail": 15, "charact": [15, 21, 24, 26], "np": [15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 47, 48, 49, 50, 51], "pluginfield": 15, "hps_conf": 15, "dtype": [15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 41, 42, 49, 50, 55], "string_": 15, "pluginfieldtyp": 15, "popular": [17, 45], "tf2onnx": [17, 30, 33], "hugectr2onnx": [17, 31, 36, 41, 55], "graphsurgeon": 17, "ld_preload": [17, 24, 30, 31, 32, 33], "usr": [17, 19, 22, 24, 26, 30, 31, 32, 33, 35, 41, 43, 49], "lib": [17, 22, 24, 26, 30, 31, 32, 33, 41, 49], "libhps_plugin": [17, 30, 31, 32, 33], "pytorch": [17, 28, 29, 34, 41, 47, 48], "ctype": [17, 30, 31, 32, 33], "cdll": [17, 30, 31, 32, 33], "rtld_global": [17, 30, 31, 32, 33], "subcompon": 18, "meet": [18, 41], "site": 18, "relationship": [18, 55], "highest": 18, "speed": [18, 30, 33, 36, 40, 55], "benefit": 18, "unifi": [18, 49, 55], "extens": [18, 41, 48, 55], "hugectr_backend": 18, "critic": [19, 20, 21, 22, 23, 24, 26, 30, 33, 41], "hps_profil": 19, "benchmark": [19, 34, 41, 54, 55], "trion": 19, "procedur": [19, 55], "embedding_cach": 19, "num_kei": 19, "p": [19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 41, 42, 43, 51, 53, 55], "table_s": 19, "630000": 19, "warmup_iter": 19, "900": [19, 28, 40, 41, 51, 53], "000285m": 19, "000384853m": 19, "median": 19, "000365m": 19, "95": [19, 23, 47], "000428m": 19, "99": [19, 23, 47], "000465m": 19, "009736m": 19, "73973e": 19, "010842m": 19, "0117076m": 19, "011596m": 19, "012219m": 19, "016642m": 19, "027379m": 19, "86236": 19, "dedupl": 19, "019159m": 19, "0272492m": 19, "027262m": 19, "028104m": 19, "029548m": 19, "052309m": 19, "36681": 19, "178875m": 19, "231377m": 19, "227815m": 19, "267493m": 19, "284738m": 19, "47672m": 19, "4389": 19, "merg": [19, 30, 35], "007656m": 19, "00850756m": 19, "008434m": 19, "009117m": 19, "011863m": 19, "018697m": 19, "118568": 19, "105163m": 19, "15741m": 19, "153763m": 19, "192302m": 19, "208846m": 19, "402043m": 19, "6503": 19, "52": [19, 23, 31, 40, 41, 47, 51, 53, 55], "021729m": 19, "0227739m": 19, "02253m": 19, "023695m": 19, "025035m": 19, "043024m": 19, "44385": 19, "decompress": 19, "deuniqu": 19, "011247m": 19, "0121274m": 19, "011953m": 19, "013055m": 19, "014706m": 19, "022186m": 19, "83661": 19, "719323": 19, "843972": 19, "854749": 19, "894188": 19, "90276": 19, "918169": 19, "parti": [19, 35, 43, 55], "git": [19, 25, 29, 30, 34, 35, 43, 47, 53], "clone": [19, 30, 35, 47, 53, 55], "cd": [19, 25, 29, 30, 34, 35, 38, 40, 41, 43, 47, 48, 53], "submodul": [19, 35, 43, 53], "recurs": [19, 35, 43, 53], "ngc": [19, 36, 47, 49, 53, 55], "mount": [19, 25, 29, 34, 43, 47], "pwd": [19, 25, 29, 30, 34, 41, 43, 47, 48], "8888": [19, 25, 29, 30, 34, 43], "mkdir": [19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 43, 46, 51, 53], "cmake": [19, 35, 36, 43, 50, 53, 55], "dcmake_build_typ": [19, 35, 43, 53], "dsm": [19, 35, 43, 53, 55], "denable_infer": [19, 30, 35], "ON": [19, 30, 35, 36, 43, 53, 55], "denable_profil": 19, "j": [19, 21, 22, 26, 32, 33, 35, 43, 53], "exit": [19, 41], "hotkei": 19, "histogram": 19, "100000": [19, 22], "hot_key_percentag": 19, "hot_key_coverag": 19, "test": [19, 30, 35, 41, 42, 45, 53, 54, 55], "discard": 19, "database_backend": [19, 55], "vdb": 19, "pdb": 19, "refresh_embeddingcach": 19, "lookup_sess": 19, "e2": 19, "model_sampl": 19, "190813m": 19, "243117m": 19, "238085m": 19, "283761m": 19, "346377m": 19, "511712m": 19, "4200": [19, 51], "075086m": 19, "127312m": 19, "121235m": 19, "166826m": 19, "219295m": 19, "285409m": 19, "8248": 19, "44": [19, 23, 26, 30, 32, 33, 40, 41, 47, 51, 53], "xx": [19, 55], "mutual": [19, 30], "accur": 19, "don": [19, 35, 55], "prepar": [19, 38, 50, 51, 55], "everyth": [19, 55], "tritonserv": [19, 24, 30, 31, 32, 33], "your_model_nam": 19, "perf_output": 19, "csv": [19, 45, 46, 49, 50], "verbos": [19, 24, 30, 32, 35, 55], "your_generated_request": 19, "pipelin": [19, 36, 54, 55], "pofil": 19, "copyright": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "2021": [20, 21, 22, 23, 24, 26, 27, 28, 37, 40, 42, 53], "corpor": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "right": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "licens": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "complianc": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "www": [20, 21, 22, 23, 24, 26, 27, 28, 33, 40, 42, 53], "org": [20, 21, 22, 23, 24, 26, 27, 28, 33, 38, 40, 42, 45, 48, 49, 53, 55], "agre": [20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 41, 42, 53], "AS": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "warranti": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "OR": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 54], "OF": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "languag": [20, 21, 22, 23, 24, 26, 27, 28, 37, 40, 42, 53], "govern": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53], "permiss": [20, 21, 22, 23, 24, 26, 27, 28, 35, 40, 42, 53], "intend": [20, 21, 22, 23, 24, 26, 27, 28, 40, 42, 53, 55], "preinstal": [20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 53], "naiv": [20, 23], "neural": [20, 21, 22, 23, 24, 26, 30, 36, 38, 41, 50, 51], "gpu_num": [20, 21, 22, 24, 26, 27, 32, 33], "iter_num": [20, 21, 22, 24, 26, 27, 32, 33], "vocabulary_range_per_slot": [20, 21, 22, 24, 26, 27, 32, 33], "naive_dnn": 20, "dense_model_path": [20, 21, 22, 24, 26, 27], "naive_dnn_dens": 20, "embedding_table_path": [20, 21, 22, 24, 26, 27, 32, 33], "naive_dnn_spars": 20, "saved_path": [20, 21, 22, 24, 26, 27, 33], "naive_dnn_tf_saved_model": 20, "np_key_typ": [20, 21, 22, 24, 26, 27, 32, 33], "np_vector_typ": [20, 21, 22, 24, 26, 27, 32, 33], "tf_key_typ": [20, 21, 22, 23, 24, 26, 27, 33], "tf_vector_typ": [20, 21, 22, 24, 26, 27, 33], "join": [20, 21, 22, 23, 24, 26, 28, 30, 32, 33, 41, 42, 45, 46, 50, 51], "generate_random_sampl": [20, 21, 22, 24, 26, 27, 32, 33], "key_dtyp": [20, 21, 22, 24, 26, 32, 33], "vocab_rang": [20, 21, 22, 23, 24, 26, 28, 32, 33], "keys_per_slot": [20, 21, 24, 32, 33], "randint": [20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33], "tf_dataset": [20, 21, 22, 24, 26, 27, 33], "from_tensor_slic": [20, 21, 22, 24, 26, 27, 33], "drop_remaind": [20, 21, 22, 24, 26, 27, 33], "trainmodel": [20, 21, 24], "init_tensor": [20, 22, 24, 26, 30, 32, 33], "super": [20, 21, 22, 23, 24, 26, 27, 28, 30, 32, 33], "initial_valu": [20, 21, 22, 24, 30, 33], "fc_1": [20, 21, 24], "kernel_initi": [20, 21, 23, 24], "ones": [20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "bias_initi": [20, 21, 23, 24], "fc_2": [20, 21, 24], "logit": [20, 21, 22, 23, 24, 26, 27, 30, 32, 33], "learning_r": [20, 21, 22, 24, 26, 27, 33, 36], "loss_fn": [20, 21, 22, 24, 26, 27, 33], "binarycrossentropi": [20, 21, 22, 24, 26, 27, 33], "from_logit": [20, 21, 22, 24, 26], "_train_step": [20, 21, 22, 24, 26, 27, 33], "gradienttap": [20, 21, 22, 24, 26, 27, 33], "tape": [20, 21, 22, 24, 26, 27, 33], "grad": [20, 21, 22, 24, 26, 33], "trainable_vari": [20, 21, 22, 24, 26, 27, 33], "apply_gradi": [20, 21, 22, 24, 26, 27, 33], "zip": [20, 21, 22, 24, 26, 27, 33, 45, 46], "id_tensor": 20, "trained_model": [20, 21, 22, 24, 26, 27, 32, 33], "weights_list": [20, 21, 22, 24, 33], "get_weight": [20, 21, 22, 24, 33], "embedding_weight": [20, 22, 24, 32, 33], "dense_model": [20, 21, 24, 26, 27, 31, 41], "get_lay": [20, 21, 24, 26, 27], "2022": [20, 21, 22, 24, 26, 27, 31, 37, 40, 53, 55], "07": [20, 21, 22, 23, 26, 27, 32, 33, 40, 41, 42, 44, 47, 51, 53], "742983": 20, "platform": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 34, 37, 41, 55], "cpu_feature_guard": [20, 21, 22, 23, 24, 26, 30, 33, 41], "cc": [20, 21, 22, 23, 24, 26, 27, 30, 33, 41], "151": [20, 21, 22, 26], "oneapi": [20, 21, 22, 23, 24, 26, 30], "onednn": [20, 21, 22, 23, 24, 26, 30], "avx2": [20, 21, 22, 26, 41], "fma": [20, 21, 22, 26, 41], "rebuild": [20, 21, 22, 23, 24, 26, 30, 33, 41, 55], "appropri": [20, 21, 22, 23, 24, 26, 30, 33, 41], "present": [20, 21, 22, 24, 30, 33], "track": [20, 21, 22, 24, 30, 33, 41], "strong": [20, 21, 22, 24, 30, 33], "rewritten": [20, 21, 22, 24, 30, 33], "subclass": [20, 21, 22, 24, 30, 33], "_________________________________________________________________": [20, 21, 26], "input_1": [20, 21, 22, 23, 24, 26], "inputlay": [20, 21, 22, 23, 24, 26, 30, 33], "embedding_l": 20, "ookup": 20, "tfoplambda": [20, 21, 22, 23, 24, 26, 30, 33], "48": [20, 21, 23, 26, 30, 32, 33, 40, 41, 47, 51], "12544": [20, 21], "257": [20, 21, 22, 24, 26, 30], "801": [20, 40], "trainabl": [20, 21, 22, 23, 24, 26, 30, 31, 33, 40, 41, 42, 44, 53], "57": [20, 22, 23, 30, 33, 40, 42, 47, 51, 53], "326494": 20, "common_runtim": [20, 21, 22, 23, 24, 26, 33, 41], "gpu_devic": [20, 21, 22, 23, 24, 26, 33, 41], "1525": [20, 21, 22, 26], "replica": [20, 21, 22, 23, 24, 26, 33, 41], "30989": [20, 21, 22, 26], "mb": [20, 21, 22, 23, 24, 26, 33, 41, 50], "tesla": [20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 51, 53], "sxm2": [20, 21, 22, 23, 24, 25, 26, 29, 31, 33, 34, 40, 41, 42, 43, 51, 53], "bu": [20, 21, 22, 23, 24, 26, 33, 40, 41], "0000": [20, 21, 22, 23, 24, 26, 33, 40, 41, 42], "00": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 40, 41, 47, 48, 51, 53], "6136": 20, "6875": 20, "4463": 20, "05712890625": 20, "3192": 20, "029296875": 20, "2180": 20, "40283203125": 20, "1419": 20, "980712890625": 20, "879": [20, 40, 42], "0396728515625": 20, "513": [20, 42], "3021240234375": 20, "272": [20, 31, 41], "9712219238281": 20, "129": 20, "147705078125": 20, "21624755859375": 20, "model_1": [20, 21, 22, 24, 26, 30], "input_2": [20, 21, 22, 23, 24, 26], "compile_metr": [20, 21, 24, 26], "645703": 20, "368": [20, 21, 26, 28, 33, 40, 41], "asset": [20, 21, 24, 26, 30, 33], "readi": [20, 21, 24, 26, 30, 31, 32, 33, 40, 49, 53], "load_model": [20, 21, 23, 24, 26], "create_and_save_inference_graph": [20, 21, 24, 26], "convert_to_sparse_model": [20, 21, 22, 24, 32, 33], "embeddings_weight": [20, 21, 22, 24, 32, 33], "wb": [20, 21, 22, 23, 24, 28, 30, 31, 32, 33, 46, 47, 48, 51], "key_fil": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec_fil": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec": [20, 21, 22, 23, 24, 28, 32, 33, 51], "key_struct": [20, 21, 22, 23, 24, 28, 32, 33, 51], "vec_struct": [20, 21, 22, 23, 24, 28, 32, 33, 51], "wa": [20, 21, 22, 23, 24, 26, 30, 35, 36, 40, 42, 43, 50, 53, 54, 55], "model_2": [20, 21, 24], "input_3": [20, 21, 22, 23, 24, 26], "reshape_1": [20, 21, 22, 23, 24], "12801": 20, "necessari": [20, 21, 26, 30, 35, 55], "peek": [20, 21, 26], "writefil": [20, 21, 22, 23, 24, 26, 30, 31, 32, 33, 40, 41, 42, 51, 53], "inference_with_saved_model": [20, 21, 26], "embedding_vectors_peek": 20, "id_tensors_peek": 20, "pars": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 55], "hctr": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 53, 55], "25": [20, 21, 23, 28, 32, 33, 40, 42, 47, 50, 51, 53], "009": [20, 40], "rk0": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 53, 55], "main": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 35, 40, 41, 42, 50, 53, 55], "010": [20, 40, 53], "db": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41, 55], "357": 20, "hps_et": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 41], "preallocatedhashmapbackend": [20, 21, 22, 26], "18446744073709551615": [20, 21, 22, 23, 24, 26, 31, 32, 33, 41], "363": [20, 40, 47], "000000": [20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 40, 41, 42, 49, 51, 53], "405": 20, "23265739": 20, "11092357": 20, "09594781": 20, "16974597": 20, "22555737": 20, "20454781": 20, "22397298": 20, "1229516": 20, "12451896": 20, "21348731": 20, "11943579": 20, "2502464": 20, "5283": 20, "17773": 20, "26371": 20, "5043": 20, "17928": 20, "22941": 20, "5154": 20, "18816": 20, "28670": 20, "9014": 20, "16185": 20, "22256": 20, "9893": 20, "14515": 20, "25771": 20, "5377": 20, "18265": 20, "28063": 20, "hierarchical_parameter_server_demo": [21, 22, 23, 24, 25, 26, 27], "dive": [21, 22, 23, 24, 26, 27, 37], "slot_num_per_t": 21, "embed_vec_size_per_t": 21, "max_vocabulary_size_per_t": 21, "vocabulary_range_per_slot_per_t": 21, "max_nnz_per_slot_per_t": 21, "multi_table_sparse_input_dens": 21, "multi_table_sparse_input": 21, "multi_table_sparse_input_sparse_0": 21, "multi_table_sparse_input_sparse_1": 21, "multi_table_sparse_input_tf_saved_model": 21, "generate_sparse_kei": [21, 22, 26], "max_nnz_per_slot": 21, "max_nnz_of_all_slot": 21, "max_nnz": [21, 22, 26, 27, 55], "sort": [21, 22, 26, 41, 46, 50], "choic": [21, 22, 26, 40], "dense_shap": [21, 22, 26], "generate_dense_kei": 21, "dense_kei": 21, "assert": [21, 23, 28, 47, 55], "sparse_kei": [21, 22, 26, 27], "init_tensors_per_t": 21, "max_nnz_of_all_slots_per_t": 21, "el": 21, "params0": 21, "params1": 21, "input_shap": 21, "fc_3": 21, "embeddings0": 21, "embeddings1": 21, "math": [21, 30, 55], "embedding_weights_per_t": 21, "51": [21, 23, 40, 41, 42, 47, 51, 53], "09": [21, 30, 41, 42, 47, 51, 53], "676041": 21, "271131": 21, "__________________________________________________________________________________________________": [21, 22, 23, 24, 26, 30, 33], "embedding_look": [21, 22, 24, 30, 33], "up_spars": [21, 22], "embedding_looku": [21, 22, 24, 30, 33], "p_spars": [21, 22], "16640": 21, "29": [21, 22, 23, 26, 27, 30, 32, 33, 40, 41, 42, 47, 51, 53], "441": [21, 41, 47], "14588": 21, "11693": 21, "8232": 21, "9658203125": 21, "6276": 21, "9736328125": 21, "4676": 21, "82861328125": 21, "2921": 21, "1875": 21, "1938": 21, "2447509765625": 21, "1093": 21, "598388671875": 21, "616": 21, "3092651367188": 21, "61248779296875": 21, "input_4": [21, 22, 23, 24], "335404": 21, "absl": [21, 24, 26, 33], "_wrapped_model": [21, 24, 26], "args_0": [21, 24, 26], "unsupport": [21, 24, 26], "renam": [21, 24, 26, 50, 55], "args_0_1": [21, 24, 26], "input_5": [21, 23, 24], "input_6": [21, 23, 24], "sparseloo": [21, 22, 26], "kuplay": [21, 22, 26], "reshape_2": [21, 23], "reshape_3": [21, 23], "29441": 21, "args_0_3": [21, 26], "embeddings0_peek": 21, "embeddings1_peek": 21, "inputs_peek": [21, 26], "2nd": [21, 40], "495": 21, "855": [21, 47], "33": [21, 23, 26, 30, 31, 32, 33, 40, 42, 47, 51, 53], "195": [21, 30, 47], "201": [21, 47, 53], "212": [21, 28, 41], "9905": 21, "1750": 21, "4223": 21, "20477": 21, "22119": 21, "23797": 21, "6111": 21, "9122444": 21, "76979905": 21, "7415885": 21, "66938084": 21, "90488005": 21, "7773342": 21, "6368773": 21, "276": [21, 47], "1610": 21, "408": [21, 30, 32, 40, 42, 53], "1884": 21, "678": [21, 28, 47], "1762": 21, "369": [21, 40], "1794": 21, "403": 21, "1216": 21, "909": 21, "1427": 21, "28882617": 21, "41947648": 21, "597903": 21, "37505823": 21, "70420146": 21, "38864705": 21, "32224336": 21, "31987724": 21, "43596342": 21, "5383081": 21, "37384593": 21, "6026224": 21, "dnn_dens": 22, "dnn_spars": 22, "dnn_tf_saved_model": 22, "dense_featur": [22, 24, 26, 27], "astyp": [22, 23, 24, 26, 27, 28, 31, 32, 33, 42, 50], "fc3": [22, 30, 40, 42, 51, 53], "input_cat": [22, 26], "input_dens": [22, 26, 27], "concat_fea": 22, "mirroredstrategi": [22, 55], "_replica_loss": 22, "compute_average_loss": 22, "_reshape_input": 22, "_dataset_fn": 22, "input_context": 22, "replica_batch_s": 22, "get_per_replica_batch_s": 22, "num_input_pipelin": 22, "input_pipeline_id": 22, "distribute_datasets_from_funct": 22, "41": [22, 23, 30, 32, 33, 40, 41, 47, 48, 51, 53], "55": [22, 23, 30, 33, 41, 42, 47, 51, 53], "554588": 22, "606412": 22, "608128": 22, "609468": 22, "0a": [22, 40, 41], "610818": 22, "0b": [22, 40, 41], "160": [22, 31, 47, 51], "170": [22, 31, 32], "175104": 22, "262400": [22, 30], "437": [22, 28, 31, 41, 47], "761": [22, 30], "eagerli": 22, "call_for_each_replica": 22, "experimental_run": 22, "dist": [22, 24, 26, 32, 49], "1082": [22, 26, 40], "userwarn": [22, 26, 42, 50], "binary_crossentropi": [22, 26], "dispatch_target": [22, 26], "batch_all_reduc": 22, "num_pack": 22, "allreduc": 22, "indexedslic": 22, "broadcast": 22, "perreplica": 22, "1950232": 22, "20766959": 22, "2006835": 22, "21188965": 22, "681": [22, 31, 47], "73474": 22, "691": 22, "33826": 22, "588": [22, 40, 42], "15265": 22, "622": [22, 47], "72485": 22, "9260483": 22, "509967": 22, "0374002": 22, "1059036": 22, "002458": 22, "7079678": 22, "333396": 22, "6451607": 22, "_apply_all_reduc": 22, "_all_reduc": 22, "0x7fba4c2dc1f0": 22, "retrac": [22, 33], "trace": [22, 32, 33, 55], "expens": [22, 33], "excess": [22, 33], "pass": [22, 30, 31, 32, 33, 41, 47, 55], "instead": [22, 24, 33, 38, 41, 55], "outsid": [22, 33, 55], "experimental_relax_shap": 22, "relax": 22, "unnecessari": [22, 33, 55], "controlling_retrac": [22, 33], "api_doc": [22, 33], "8326673": 22, "79405844": 22, "85364443": 22, "92679256": 22, "0x7fba4c2dcdc0": 22, "5796976": 22, "54752666": 22, "57471323": 22, "54845804": 22, "61678064": 22, "647662": 22, "6421599": 22, "6278339": 22, "28049487": 22, "2768654": 22, "2943622": 22, "2805586": 22, "2102679": 22, "368755": 22, "4997649": 22, "5143406": 22, "413176": 22, "42411563": 22, "38453132": 22, "4314984": 22, "pretrainedembed": 22, "fc": [22, 23, 47, 54], "new_fc": 22, "train_with_pretrained_embed": 22, "707": [22, 47], "17": [22, 23, 26, 27, 32, 33, 41, 47, 51, 53, 55], "153": 22, "177": [22, 30, 33], "180": [22, 33], "188": [22, 31, 42], "191": [22, 47, 53], "197": 22, "concat_1": [22, 32], "171": [22, 30, 31, 41], "17934436": 22, "17969523": 22, "18917403": 22, "18102707": 22, "7858478": 22, "68311": 22, "66279": 22, "5826445": 22, "7325904": 22, "7331751": 22, "7210605": 22, "7671325": 22, "62144834": 22, "5696643": 22, "5946336": 22, "64713424": 22, "88115656": 22, "9079187": 22, "98161024": 22, "97925556": 22, "6572284": 22, "6304919": 22, "66552734": 22, "6695935": 22, "2002374": 22, "19162768": 22, "1874283": 22, "19209734": 22, "5284709": 22, "6028371": 22, "5635803": 22, "5773235": 22, "74001855": 22, "71915305": 22, "619328": 22, "7890761": 22, "55197906": 22, "5565746": 22, "52792": 22, "6230979": 22, "templat": [23, 38], "emebed": 23, "off": [23, 35, 40, 55], "create_model_for_table_fus": 23, "pytest": [23, 28], "vocab_s": [23, 28], "num_query_kei": [23, 28], "num_it": [23, 28], "list_physical_devic": [23, 27], "set_memory_growth": [23, 27], "set_inter_op_parallelism_thread": 23, "hps_config": [23, 28], "_tabl": [23, 28], "generate_embedding_t": [23, 28], "hugectr_sparse_model": [23, 28, 51], "00025": 23, "set_up_model_fil": [23, 28], "table_nam": [23, 27, 28, 55], "model_file_nam": [23, 28], "concat_embed": 23, "create_savedmodel": 23, "hps_config_json_object": [23, 28], "indent": [23, 28], "outfil": [23, 28], "__name__": [23, 30, 41], "__main__": [23, 30, 32, 41], "2023": [23, 30, 32, 33, 40, 41, 42, 55], "03": [23, 30, 32, 33, 40, 42, 44, 47, 49, 50, 51, 53], "28": [23, 24, 30, 32, 33, 40, 42, 47, 51, 53], "206281": 23, "194": [23, 24, 28, 30], "sse3": [23, 24, 26, 30, 33], "sse4": [23, 24, 26, 30, 33], "avx": [23, 24, 26, 30, 33], "36": [23, 24, 30, 31, 32, 33, 40, 47, 51, 53], "420084": 23, "926162": 23, "1637": 23, "30996": 23, "input_7": [23, 24], "input_8": 23, "embedding_lookup0": 23, "embedding_lookup1": 23, "embedding_lookup2": 23, "embedding_lookup3": 23, "embedding_lookup4": 23, "embedding_lookup5": 23, "embedding_lookup6": 23, "embedding_lookup7": 23, "3328": [23, 32], "reshape_4": 23, "reshape_5": 23, "reshape_6": 23, "reshape_7": 23, "26624": 23, "26625": 23, "625": 23, "38": [23, 30, 31, 32, 33, 41, 47, 51, 53], "079": 23, "use_static_t": [23, 28, 30, 31, 32, 33], "8_tabl": [23, 28], "080": [23, 40], "blank": [23, 24, 28, 30, 31, 32, 33, 41], "547": [23, 40, 47], "table0": [23, 28], "hashmapbackend": [23, 24, 31, 32, 33, 41], "39": [23, 26, 32, 33, 40, 47, 51, 53, 54], "379": [23, 40, 42, 47], "830": 23, "40": [23, 30, 32, 33, 40, 41, 42, 47, 51, 53], "448": 23, "table3": [23, 28], "899": [23, 40, 45], "table4": [23, 28], "934": [23, 40], "table5": [23, 28], "43": [23, 26, 32, 33, 41, 47, 48, 53], "097": [23, 30, 40, 42], "table6": [23, 28], "296": [23, 28, 41, 45, 55], "table7": [23, 28], "297": [23, 47], "306": [23, 45, 53], "469": 23, "470": [23, 47], "ec": [23, 24, 28, 30, 31, 32, 33, 55], "475": [23, 28, 47], "lookupsess": [23, 28, 30, 33, 41], "inputs_seq": [23, 28], "elaps": [23, 28], "918038": 23, "325440": 23, "818316": 23, "756": [23, 28, 40], "hps_database_backend": [23, 28], "html": [23, 24, 28, 30, 31, 32, 33, 41, 48, 50, 55], "292": [23, 40, 53], "fused_embedding0": [23, 28], "80000": 23, "299": [23, 26, 31, 40], "406": [23, 40, 47], "407": [23, 40, 41, 47, 53], "14": [23, 24, 30, 31, 32, 33, 40, 41, 42, 47, 49, 51, 53], "19": [23, 32, 33, 40, 41, 42, 47, 51, 53], "21": [23, 30, 32, 33, 41, 47, 49, 51, 53], "27": [23, 26, 30, 31, 32, 33, 40, 41, 42, 47, 51, 53], "30": [23, 26, 32, 33, 40, 41, 47, 50, 51, 53, 55], "35": [23, 31, 32, 33, 40, 47, 51, 53], "37": [23, 24, 30, 31, 32, 33, 40, 41, 42, 47, 53], "46": [23, 31, 32, 33, 40, 41, 42, 47, 51], "47": [23, 31, 32, 33, 41, 47, 51], "54": [23, 30, 31, 32, 40, 41, 42, 47, 51, 53], "60": [23, 26, 27, 35, 38, 47, 53], "62": [23, 42, 45, 47], "63": [23, 31, 47, 53], "65": [23, 47], "66": [23, 24, 47], "68": [23, 47, 50], "69": [23, 47], "73": [23, 26, 30, 32, 47], "74": [23, 30, 47], "77": [23, 40, 42, 47], "78": [23, 47], "79": [23, 42, 47], "81": [23, 47], "82": [23, 47], "83": [23, 40, 47], "84": [23, 26, 40, 47], "85": [23, 24, 26, 30, 40, 41, 47], "87": [23, 47], "88": [23, 47], "89": [23, 24, 40, 41, 47], "91": [23, 42, 47], "92": [23, 30, 47], "93": [23, 47], "96": [23, 47], "97": [23, 42, 47], "9442901611328125": 23, "hps_tf_triton_dens": 24, "hps_tf_triton": 24, "hps_tf_triton_sparse_0": 24, "hps_tf_triton_tf_saved_model": 24, "requestsdependencywarn": 24, "urllib3": 24, "chardet": 24, "doesn": [24, 42, 55], "concated_featur": 24, "919938": 24, "444040": 24, "1532": 24, "30991": 24, "23296": 24, "553": [24, 30, 40, 47], "10934": 24, "333984375": 24, "9218": 24, "0703125": 24, "7060": 24, "255859375": [24, 33], "5094": 24, "876953125": 24, "3605": 24, "475830078125": 24, "2593": 24, "270751953125": 24, "1741": 24, "0677490234375": 24, "1045": 24, "5091552734375": 24, "541": [24, 30, 40, 47], "4227905273438": 24, "242": [24, 47], "8596649169922": 24, "hps_tf": [24, 25], "model_repo": [24, 30, 31, 32, 33], "triton_model_repo": 24, "23553": 24, "pbtxt": [24, 30, 31, 32, 33], "mv": [24, 26, 27, 30, 31, 32, 33], "tensorflow_savedmodel": 24, "data_typ": [24, 30, 31, 32, 33], "type_int64": 24, "type_fp32": [24, 30, 31, 32, 33], "output_1": [24, 30, 33], "version_polici": 24, "instance_group": [24, 30, 31, 32, 33], "kind_gpu": [24, 30, 31, 32, 33], "tree": [24, 30, 31, 32, 33, 50, 55], "34mmodel_repo": [24, 31, 32, 33], "00m": [24, 31, 32], "34m1": [24, 31, 32, 33], "34mmodel": 24, "34masset": 24, "keras_metadata": 24, "pb": 24, "saved_model": [24, 30, 33], "34mvariabl": 24, "00000": 24, "34mhps_tf_triton_sparse_0": 24, "background": [24, 30, 31, 32, 33, 41, 55], "merlin_hp": 24, "py3": 24, "x86_64": [24, 31, 41], "egg": 24, "libhierarchical_parameter_serv": 24, "curl": 24, "format_non": 24, "is_shape_tensor": 24, "allow_ragged_batch": 24, "label_filenam": 24, "batch_input": 24, "batch_output": 24, "prioriti": [24, 54], "priority_default": 24, "input_pinned_memori": 24, "output_pinned_memori": 24, "gather_kernel_buffer_threshold": 24, "eager_batch": 24, "dynamic_batch": 24, "preferred_batch_s": 24, "max_queue_delay_microsecond": 24, "preserve_ord": 24, "priority_level": 24, "default_priority_level": 24, "priority_queue_polici": 24, "hps_tf_triton_0": 24, "secondary_devic": 24, "profil": [24, 30, 31, 32, 33, 44, 55], "passiv": 24, "host_polici": 24, "default_model_filenam": [24, 30, 31, 32, 33], "cc_model_filenam": 24, "metric_tag": 24, "model_warmup": 24, "tritoncli": [24, 31, 32, 33], "httpclient": [24, 31, 32, 33], "send_inference_request": 24, "num_request": 24, "triton_cli": 24, "inferenceservercli": [24, 31, 32, 33], "is_server_l": 24, "get_model_repository_index": 24, "key_tensor": [24, 41], "dense_tensor": 24, "inferinput": [24, 31, 32, 33], "np_to_triton_dtyp": [24, 31, 32, 33], "set_data_from_numpi": [24, 31, 32, 33], "inferrequestedoutput": [24, 31, 32, 33], "get_respons": [24, 31, 32, 33], "health": 24, "httpsocketpoolrespons": 24, "plain": 24, "post": [24, 54], "bytearrai": 24, "model_vers": [24, 31, 32, 33], "binary_data_s": [24, 31, 32, 33], "fall": 24, "trt_convert": 24, "original_model_path": 24, "new_model_path": 24, "instanti": [24, 50], "trtgraphconverterv2": 24, "input_saved_model_dir": 24, "precision_mod": 24, "trtprecisionmod": 24, "trt_func": 24, "convert_to_tensor": [24, 27], "input_fn": 24, "yield": 24, "output_saved_model_dir": 24, "clear": [24, 30, 32, 33, 50], "prior": [24, 30, 33], "924379": 24, "grappler": 24, "elig": 24, "924537": 24, "single_machin": 24, "928272": 24, "deactiv": 24, "028482": 24, "028568": 24, "061909": 24, "068593": 24, "tf2tensorrt": 24, "trt_optimization_pass": 24, "198": 24, "calibr": 24, "use_calibr": 24, "069761": 24, "952": [24, 40], "noop": 24, "1x": 24, "nonconvert": 24, "deeplearn": 24, "069860": 24, "tf_trt_max_allowed_engin": 24, "minimum_segment_s": 24, "069893": 24, "convert_graph": 24, "799": [24, 30, 40, 47], "candid": 24, "060667": 24, "916": [24, 40], "trtengineop_000_000": 24, "trtengineop": 24, "biasadd": 24, "concatv2": 24, "const": [24, 30, 33, 41], "matmul": [24, 26, 27, 32, 33], "329": [24, 41, 47, 53], "745": [24, 33, 40], "753": [24, 41, 47], "200000": [24, 31, 32, 33], "778": [24, 47], "814": [24, 31, 47], "815": 24, "818078": 24, "104": [24, 28, 42, 47], "818150": 24, "106": [24, 30, 41], "749149": 24, "convert_nod": 24, "1275": 24, "814132": 24, "trt_logger": [24, 30, 31, 32, 33], "defaultlogg": 24, "cpp": [24, 30, 31, 32, 33, 41, 55], "cublaswrapp": 24, "cubla": [24, 30, 31, 32, 33], "817575": 24, "trt_engine_op": 24, "1061": [24, 33], "creation": 24, "817694": 24, "894": [24, 41], "823806": 24, "34m2": 24, "serial": 24, "numba": [24, 30, 33, 42], "select_devic": [24, 30, 33], "close": [24, 30, 33], "rememb": [24, 30, 35], "kill": 24, "again": [24, 30, 55], "simplest": [25, 29, 34, 43], "isol": [25, 29, 34, 43], "repetit": [25, 29, 34, 43], "prefer": [25, 28, 29, 34], "notebookapp": [25, 29, 34, 43, 48], "token": [25, 29, 34, 43, 48], "web": [25, 29, 30, 34, 37, 43, 55], "browser": [25, 29, 30, 34, 43], "aae96ae9387cd28151868fee318c3b3581a2d794f3b25c6b": [25, 29, 34, 43], "hps_multi_table_sparse_input_demo": 25, "hps_pretrained_model_training_demo": 25, "mirror": [25, 55], "sok_to_hps_dlrm_demo": 25, "sparseoperationkit": [25, 26, 27, 55], "hps_table_fusion_demo": 25, "author": [25, 29, 34, 37, 41, 43], "intel": [25, 29, 34, 43, 54], "xeon": [25, 29, 34, 43, 54], "e5": [25, 29, 34, 43, 54], "2698": [25, 29, 34, 43, 54], "v4": [25, 29, 34, 43, 54, 55], "20ghz": [25, 29, 34, 43, 54], "kingslei": [25, 29, 34, 37, 43], "liu": [25, 29, 34, 37, 43], "hierarchicalparameterserv": [26, 27], "sparse_operation_kit_demo": [26, 27, 55], "sparse_operation_kit": [26, 27, 35, 43, 55], "sy": [26, 27, 30, 33, 41, 42, 47, 50], "unit_test": 26, "test_script": 26, "tf2": 26, "260000": [26, 27, 31, 32, 33], "dlrm_dens": [26, 27], "dlrm_spars": [26, 27, 30], "dlrm_tf_saved_model": [26, 27, 33], "plugin_adam": 26, "arch": [26, 27, 32, 33], "out_activ": [26, 27, 32, 33], "secondorderfeatureinteract": [26, 27, 32, 33], "self_interact": [26, 27], "dot_product": [26, 27, 32, 33], "transpose_b": [26, 27, 33], "ones_lik": [26, 27], "linalg": [26, 27], "band_part": [26, 27], "flat_interact": [26, 27, 32, 33], "boolean_mask": [26, 27], "max_vocabulary_size_per_gpu": [26, 55], "arch_bot": [26, 27, 32, 33], "arch_top": [26, 27, 32, 33], "embedding_lay": [26, 27], "bot_nn": [26, 27, 33], "top_nn": [26, 27, 33], "interaction_op": [26, 27, 33], "interaction_out_dim": [26, 27, 32, 33], "els": [26, 27, 40, 41, 42, 47, 49, 51], "reshape_layer1": [26, 27, 33], "dense_x": [26, 27, 32, 33], "concat_featur": [26, 27, 30, 32, 33], "z": [26, 27, 32, 33], "emb_opt": 26, "get_embedding_optim": 26, "dense_opt": [26, 27], "get_dense_optim": 26, "embedding_sav": [26, 27], "load_embedding_valu": 26, "embedding_vari": [26, 27], "other_vari": 26, "split_embedding_variable_from_oth": 26, "emb_grad": 26, "optimizerscop": 26, "experimental_aggregate_gradi": 26, "793169": 26, "152": [26, 42], "323141": 26, "gpu_bfc_alloc": 26, "allow_growth": 26, "tf_force_gpu_allow_growth": 26, "323214": 26, "30997": 26, "078977": 26, "kit_cc": [26, 27], "kit_cc_infra": [26, 27], "src": [26, 27, 41], "107": 26, "local_replica_id": 26, "109": 26, "4287744788": 26, "raw_manag": [26, 27], "132": [26, 30, 53], "embeddingvari": [26, 27], "raw_param": 26, "120": [26, 31, 41, 47], "global_replica_id": 26, "137": [26, 28, 47], "facad": 26, "225": [26, 40, 47], "378": [26, 42, 53], "temporari": 26, "kit_cc_impl": [26, 27], "dumping_funct": [26, 27], "num_total_kei": 26, "total_max_vocabulary_s": 26, "350": 26, "upload": 26, "loop_num": 26, "260": 26, "235": [26, 40], "9379717111587524": 26, "12726": 26, "013671875": 26, "78772735595703": 26, "33247375488281": 26, "48320770263672": 26, "234": [26, 30], "79978942871094": 26, "6663873195648193": 26, "426162719726562": 26, "430748462677002": 26, "768443584442139": 26, "38544": 26, "distributed_embed": 26, "distrib": 26, "4160000": 26, "utedembed": 26, "second_order_feature_interacti": [26, 33], "ion": [26, 33], "second_order_feature_interactio": [26, 33], "127233": 26, "325": [26, 47], "777": [26, 30, 47, 53], "165": 26, "089529": 26, "untrac": [26, 33], "bottom_0_layer_call_fn": [26, 33], "bottom_0_layer_call_and_return_conditional_loss": [26, 33], "bottom_1_layer_call_fn": [26, 33], "bottom_1_layer_call_and_return_conditional_loss": [26, 33], "bottom_2_layer_call_fn": [26, 33], "callabl": [26, 33], "embeddingvariable_kei": [26, 27], "embeddingvariable_valu": [26, 27], "079021": [26, 27], "192": [26, 27, 41], "147": [26, 27, 40, 47], "18360": [26, 27], "rw": [26, 27, 53], "nobodi": [26, 27], "nogroup": [26, 27], "16640000": [26, 27], "jul": [26, 27], "2080000": [26, 27], "911439": 26, "490542": 26, "165777": 26, "043599": 26, "embeddings_peek": 26, "183": [26, 28, 33, 40], "184": 26, "682": 26, "689": 26, "736": [26, 53], "888": [26, 40], "4486": 26, "5745": 26, "255671": 26, "252879": 26, "252045": 26, "145888": 26, "6825647": 26, "6801282": 26, "68074": 26, "68074226": 26, "6818684": 26, "6809397": 26, "3980061": 26, "3981627": 26, "3980992": 26, "78289294": 26, "7833897": 26, "78293324": 26, "78336245": 26, "78305507": 26, "78301686": 26, "880705": 26, "88164043": 26, "88109225": 26, "87982655": 26, "88028604": 26, "88119066": 26, "8650326": 26, "86442304": 26, "86414057": 26, "8642554": 26, "8640611": 26, "8645548": 26, "783202": 26, "78315204": 26, "78240466": 26, "7826805": 26, "78258413": 26, "7824805": 26, "8573375": 26, "85796195": 26, "85979205": 26, "8595341": 26, "85846806": 26, "85798156": 26, "7563881": 26, "7563928": 26, "7564304": 26, "7563316": 26, "7563634": 26, "7564283": 26, "62020814": 26, "6213356": 26, "62018126": 26, "62036": 26, "6201106": 26, "6201722": 26, "85459447": 26, "85330284": 26, "854774": 26, "854769": 26, "8547034": 26, "85447353": 26, "64481944": 26, "6447684": 26, "6449137": 26, "64472693": 26, "64465916": 26, "64503783": 26, "7852191": 26, "78577": 26, "78521436": 26, "7852911": 26, "78544927": 26, "7853453": 26, "6184057": 26, "61849916": 26, "61735946": 26, "61852926": 26, "61921203": 26, "6175788": 26, "7092892": 26, "7092928": 26, "7092843": 26, "70928746": 26, "70928514": 26, "70928574": 26, "6360293": 26, "6360285": 26, "636029": 26, "63602984": 26, "63602865": 26, "63602734": 26, "69062346": 26, "69038725": 26, "690281": 26, "6907744": 26, "6904431": 26, "6903974": 26, "6840397": 26, "684031": 26, "68404853": 26, "6840508": 26, "68404937": 26, "68404216": 26, "7159784": 26, "71973306": 26, "7159706": 26, "7161063": 26, "71603465": 26, "71592766": 26, "67292804": 26, "67351913": 26, "67328465": 26, "67328894": 26, "6733438": 26, "67301095": 26, "68593156": 26, "6859398": 26, "68593466": 26, "6859294": 26, "6859311": 26, "68593705": 26, "72352993": 26, "7230278": 26, "72331727": 26, "72321206": 26, "72359455": 26, "7233958": 26, "60178": 26, "6017275": 26, "60140777": 26, "60140765": 26, "60151523": 26, "6015818": 26, "73245263": 26, "73322636": 26, "7328412": 26, "73278296": 26, "7325789": 26, "7329973": 26, "68950844": 26, "69225705": 26, "6898281": 26, "6889306": 26, "68944615": 26, "69020116": 26, "848309": 26, "84465414": 26, "84872234": 26, "8486877": 26, "84938526": 26, "8492384": 26, "701107": 26, "6997489": 26, "70110285": 26, "700902": 26, "7011098": 26, "70111394": 26, "5723409": 26, "5738345": 26, "5723305": 26, "57233423": 26, "57233775": 26, "572342": 26, "82768726": 26, "82793933": 26, "8282728": 26, "8282294": 26, "82802093": 26, "8280283": 26, "6491487": 26, "64926434": 26, "64963746": 26, "64926565": 26, "64935625": 26, "64957225": 26, "5615084": 26, "56340796": 26, "5635457": 26, "5635438": 26, "5613529": 26, "56135494": 26, "9477315": 26, "94783926": 26, "94776624": 26, "9477597": 26, "9477446": 26, "9477345": 26, "74906373": 26, "7491199": 26, "74906075": 26, "7490612": 26, "7490609": 26, "7490617": 26, "6141995": 26, "6144503": 26, "6139838": 26, "6140719": 26, "6141932": 26, "61409426": 26, "6773844": 26, "67902935": 26, "67736465": 26, "6773715": 26, "6773739": 26, "67744035": 26, "700472": 26, "70258003": 26, "69977176": 26, "70001334": 26, "75941193": 26, "7594471": 26, "75891864": 26, "7593392": 26, "75900066": 26, "75923026": 26, "tf_cpp_min_log_level": 27, "local_batch_s": 27, "1200": [27, 31, 51, 53], "tolist": 27, "sok_backend_typ": 27, "selcet": 27, "hkv": [27, 55], "det": [27, 55], "sparse_model_path": 27, "sok_embedding_table_path": 27, "sok_dlrm_spars": 27, "local_rank": 27, "generate_ragged_tensor_sampl": 27, "embedding_table_s": 27, "lookup_num": 27, "total_indic": 27, "reduce_sum": 27, "raggedtensor": 27, "from_row_length": 27, "total_data": 27, "dynamicvari": [27, 55], "lookup_spars": [27, 55], "sokemblay": 27, "embedding_dim": [27, 51], "var_typ": 27, "table_num": 27, "sok_var": [27, 55], "init_capac": 27, "max_capac": 27, "reshape_layer_list": 27, "sok_reshap": 27, "sok_concat1": 27, "ret_embed": 27, "embed_vec_dim": 27, "embedding_model": 27, "sok_embed": 27, "dense_reshape1": 27, "dense_concat1": 27, "dense_concat2": 27, "input_spars": 27, "sparse_input": 27, "dense_input": [27, 41], "get_embedding_model": 27, "get_embedding_vari": 27, "get_dense_vari": 27, "tmp_var": 27, "sparse_var": 27, "dense_var": 27, "filter_vari": 27, "embedding_load": [27, 55], "opt": [27, 30, 31, 32, 33, 35, 41, 43, 53], "embedding_var": 27, "embedding_dump": [27, 55], "trainer": 27, "distributedgradienttap": 27, "embedding_opt": 27, "optimizerwrapp": [27, 55], "emb_tap": 27, "dense_grad": 27, "embedding_grad": 27, "input_tupl": 27, "dump_model": 27, "du": 28, "lh": 28, "0m": [28, 33, 41, 49], "40m": 28, "multithread": 28, "jit": [28, 33], "fork": [28, 41], "ground": [28, 41], "truth": [28, 41], "modulelist": 28, "keys_list": 28, "annot": 28, "fut": 28, "preds_seq": 28, "preds_seq_gt": 28, "diff": [28, 41], "mse": [28, 41], "05": [28, 30, 31, 42, 44, 45, 46, 47, 49, 51, 53], "836": [28, 40], "839": [28, 47, 53], "use_hctr_cache_implement": [28, 30, 33, 55], "init_ec": [28, 30, 33], "840": [28, 31, 54], "880": [28, 47, 53], "936": 28, "pointer": 28, "975": 28, "018": [28, 33, 40], "041": [28, 40], "059": [28, 40, 42], "070": [28, 40], "088": [28, 40], "113": 28, "123": [28, 40, 41], "167": [28, 30, 41, 47], "196": [28, 31, 47], "210": [28, 34], "223": 28, "239": 28, "252": [28, 41], "284": [28, 40], "307": [28, 45, 47, 53], "319": [28, 40], "336": [28, 30, 53], "360": [28, 47, 53], "390": [28, 40], "409": [28, 40, 42, 53], "446": 28, "453": [28, 41], "515": [28, 30, 47], "535": 28, "560": [28, 47], "580": [28, 40], "597": 28, "606": [28, 40, 53], "615": [28, 40, 47], "624": [28, 33, 47], "632": 28, "668": [28, 40, 47, 53], "695": [28, 47, 53], "712": [28, 53], "725": [28, 47], "740": [28, 53], "768": [28, 40], "783": [28, 31, 40], "794": [28, 40, 47], "821": [28, 47], "844": [28, 47], "861": 28, "890": 28, "920": [28, 31, 47], "929": [28, 41, 42], "938": [28, 41], "957": [28, 31, 47], "979": [28, 40], "006": [28, 40, 53], "016": [28, 40], "027": [28, 40], "037": [28, 40], "046": [28, 40], "056": [28, 40], "064": [28, 33, 41, 42], "085": [28, 42], "095": 28, "110": 28, "125": 28, "136": [28, 47], "163": [28, 40, 47], "173": 28, "231": 28, "249": 28, "250": [28, 40, 41, 47], "10996460914611816": 28, "hps_torch_demo": 29, "plugin_lib_nam": [30, 31, 32, 33], "plugin_handl": [30, 31, 32, 33], "08": [30, 31, 33, 41, 47, 51, 53], "552734": 30, "litemodel": 30, "reduced_embed": 30, "reduce_mean": [30, 41], "keepdim": 30, "numrical_featur": [30, 33], "3fc_light": 30, "embedding_lookup_1": 30, "inputlai": 30, "er": 30, "up_1": 30, "reduce_mean_1": 30, "tfoplam": 30, "bda": 30, "p_1": 30, "141": 30, "145408": 30, "065": 30, "Then": [30, 31, 32, 33, 47, 48], "graphsurgoen": [30, 31, 32, 33], "deeplearningexampl": [30, 47], "quick": [30, 35], "spark": 30, "fast": [30, 50], "verif": 30, "final_output_dir": 30, "frequency_limit": 30, "roughli": 30, "quickli": [30, 50, 55], "haven": 30, "feauture_": 30, "npy": [30, 41], "deploy_path": 30, "hps_model": 30, "memb_vector": 30, "mkei": 30, "light": [30, 36], "enable_pagelock": [30, 33], "577492": 30, "runpi": [30, 33], "runtimewarn": [30, 33], "unpredict": [30, 33], "behaviour": [30, 33], "msg": [30, 33], "462": [30, 47, 53], "protobuf": [30, 33, 55], "extrem": [30, 33, 38], "slow": [30, 33], "1557": [30, 33], "tag": [30, 33, 35, 41, 55], "928": [30, 47], "signatur": [30, 33, 41], "serving_default": [30, 33], "signature_def": [30, 33], "440": [30, 31, 40, 41], "8f8d49": [30, 33], "opset": [30, 33], "459": 30, "fold": [30, 33], "482": [30, 47], "781": [30, 31, 41], "onnx_graphsurgeon": [30, 31, 32, 33], "shape_infer": [30, 31, 32, 33], "import_onnx": [30, 31, 32, 33], "statefulpartitionedcal": [30, 33], "unknown": [30, 32, 33], "hps_node": [30, 32, 33], "attr": [30, 31, 32, 33], "cleanup": [30, 31, 32, 33, 55], "toposort": [30, 31, 32, 33], "export_onnx": [30, 31, 32, 33], "3fc_light_with_hp": 30, "color": 30, "pip": [30, 41, 46, 47, 48, 49, 55], "distinct": 30, "139822124016208": 30, "139821990953120": 30, "unk__6": 30, "logger": [30, 31, 32, 33], "explicit_batch": [30, 31, 32, 33], "networkdefinitioncreationflag": [30, 31, 32, 33], "create_hps_plugin_cr": 30, "trt_version": 30, "__version__": 30, "init_libnvinfer_plugin": 30, "plg_registri": 30, "get_plugin_registri": 30, "plugin_cr": 30, "plugin_creator_list": 30, "hps_plugin_cr": 30, "get_plugin_cr": 30, "build_engine_from_onnx": [30, 31, 32, 33], "onnx_model_path": [30, 31, 32, 33, 41], "builder": [30, 31, 32, 33], "create_network": [30, 31, 32, 33], "onnxpars": [30, 31, 32, 33], "create_builder_config": [30, 31, 32, 33], "builder_config": [30, 31, 32, 33], "rb": [30, 31, 32, 33, 46, 48, 49], "set_flag": 30, "builderflag": [30, 33], "create_optimization_profil": [30, 31, 32, 33], "set_shap": [30, 31, 32, 33], "add_optimization_profil": [30, 31, 32, 33], "build_serialized_network": [30, 31, 32, 33], "serialized_engin": [30, 31, 32, 33], "dynamic_3fc_light": 30, "fout": [30, 31, 32, 33], "memusagechang": [30, 31, 32, 33], "974": [30, 40], "2531": 30, "661": 30, "2943": 30, "735": 30, "lazi": [30, 31, 32, 33, 55], "regist": [30, 31, 32, 33, 46], "plugin_vers": [30, 31, 32, 33], "plugin_namespac": [30, 31, 32, 33], "116": [30, 31, 40, 53], "117": [30, 47], "140": [30, 41], "227": [30, 32, 47], "ktf32": [30, 33], "0088975": 30, "cublaslt": [30, 31, 32, 33, 55], "2952": 30, "12129": 30, "349": [30, 53], "190": 30, "3301": 30, "12319": 30, "against": 30, "persist": [30, 31, 32, 33, 40, 55], "16672": 30, "memusagestat": [30, 31, 32, 33], "1248": 30, "blockassign": [30, 31, 32, 33], "shift": [30, 31, 32, 33], "shiftntopdown": [30, 31, 32, 33], "took": [30, 31, 32, 33], "040758m": 30, "905970176": 30, "905969664": 30, "3302": 30, "12397": 30, "12407": 30, "encount": [30, 55], "affect": [30, 55], "accuraci": [30, 55], "subnorm": 30, "dynamic_3fc_lite_hps_trt": 30, "tensorrt_plan": [30, 31, 32, 33], "type_int32": [30, 31, 32, 33], "mmodel_repo": 30, "pythonpath": 30, "tensorflow2": 30, "dlrm_and_dcnv2": 30, "perf_data": 30, "minut": 30, "finish": [30, 31, 40, 41, 42, 53], "spark2json": 30, "dataset_path": 30, "binary_split_converted_data": 30, "num": [30, 31, 40, 41, 42, 51, 53], "2000000": [30, 42], "grpcinferenceservic": 30, "8001": 30, "httpservic": 30, "8002": 30, "sh": [30, 36, 38, 40, 41], "echo": [30, 41], "bash": [30, 38, 40], "25600": 30, "time_window": 30, "window": 30, "5000": [30, 31, 42, 51, 55], "msec": 30, "20941": 30, "1163": 30, "sec": 30, "851": 30, "standard": [30, 50, 55], "deviat": [30, 50], "1184": 30, "p50": 30, "p90": 30, "922": 30, "p95": 30, "977": 30, "p99": 30, "1190": 30, "846": [30, 41], "recv": 30, "343": 30, "108": [30, 47], "12800": 30, "14135": 30, "785": [30, 31, 40], "143": [30, 47], "1264": 30, "286": [30, 31, 40], "1236": 30, "1340": 30, "1374": 30, "1476": 30, "1258": 30, "1166": 30, "889": [30, 40], "619": [30, 40], "156": [30, 41, 47], "6400": 30, "8116": 30, "450": 30, "826": 30, "2206": [30, 32], "391": [30, 42, 47], "2183": 30, "2321": 30, "2368": 30, "2486": 30, "2199": 30, "118": [30, 47, 53], "2081": 30, "1632": 30, "1173": 30, "3200": [30, 51], "5311": 30, "295": [30, 41, 47], "3377": 30, "3349": 30, "3486": 30, "3530": 30, "3820": 30, "3370": 30, "155": 30, "3215": 30, "2591": 30, "162": [30, 45, 47], "2068": 30, "1600": [30, 51, 53], "3518": 30, "5109": 30, "5068": 30, "5242": 30, "5316": 30, "5741": 30, "5104": 30, "4933": 30, "4134": 30, "138": 30, "3742": 30, "800": [30, 31, 40, 41, 51, 53], "1910": 30, "9412": 30, "9384": 30, "9529": 30, "9581": 30, "10106": 30, "9406": 30, "294": [30, 32, 53], "9112": 30, "7674": 30, "267": 30, "7179": 30, "130": [30, 47], "400": [30, 31, 40, 41, 51, 53], "992": [30, 33], "1033": 30, "18132": 30, "726": 30, "18051": 30, "18257": 30, "18330": 30, "23069": 30, "18125": 30, "1278": 30, "16847": 30, "14999": 30, "476": [30, 40, 47], "14234": 30, "203": [30, 33, 41], "6081": 30, "34878": 30, "34734": 30, "35143": 30, "35288": 30, "40804": 30, "34872": 30, "2584": 30, "32288": 30, "516": [30, 40], "29340": 30, "870": [30, 47], "28111": 30, "270": [30, 31], "253": [30, 40], "053": 30, "71063": 30, "1570": 30, "70749": 30, "71666": 30, "73226": 30, "77979": 30, "71058": 30, "5092": 30, "65966": 30, "60716": 30, "1804": 30, "58482": 30, "333": [30, 40], "argpars": [30, 40, 42, 47], "argumentpars": [30, 40, 42], "glob": [30, 42, 47, 50], "defaultdict": [30, 46], "log_pattern": 30, "inference_benchmark": 30, "cmd_log": 30, "result_log": 30, "extract_result_from_log": 30, "log_path": 30, "job_log_pattern": 30, "readlin": 30, "job_log": 30, "each_job_log": 30, "add_argu": [30, 40, 42], "parse_arg": [30, 40, 42], "perf_result": 30, "idx": [30, 32], "tresult": 30, "prebuilt": 30, "undergo": 30, "soon": 30, "arm": 30, "particular": [30, 35, 50, 55], "yourself": [30, 43], "setup": [30, 35, 43, 55], "contrast": 30, "advis": 30, "slight": 30, "alter": 30, "nvstage": 30, "dockerfil": [30, 35], "ctr": [30, 35, 37, 38, 39, 56], "sed": 30, "duse_huge_pag": 30, "action": [30, 40], "sudo": 30, "180000": 30, "node0": 30, "hugepag": [30, 41], "2048kb": 30, "nr_hugepag": 30, "reus": 30, "accomplish": 30, "suggest": 30, "hctr_src": 30, "chmod": 30, "lab": [30, 47, 48, 55], "predcondit": 30, "outlin": [30, 35], "itself": 30, "data_parquet": [31, 41], "561": [31, 41, 47], "564": [31, 40, 41], "568": [31, 40, 41, 47], "gen_0": [31, 41, 53], "204": [31, 42], "gen_1": [31, 41, 53], "455": 31, "gen_2": [31, 41, 53], "709": 31, "gen_3": [31, 41, 53], "gen_4": [31, 41, 53], "gen_5": [31, 41, 53], "gen_6": [31, 41, 53], "gen_7": [31, 41, 53], "gen_8": [31, 41, 53], "gen_9": [31, 41, 53], "411": [31, 47, 53], "gen_10": [31, 41, 53], "650": [31, 40], "gen_11": [31, 41, 53], "885": [31, 40, 47], "gen_12": [31, 41, 53], "gen_13": [31, 41, 53], "341": [31, 47], "gen_14": [31, 41, 53], "577": [31, 41], "gen_15": [31, 41, 53], "818": 31, "827": 31, "066": [31, 53], "537": [31, 40], "751": [31, 40], "mpi4pi": [31, 40, 41, 42, 43, 51, 53], "0001": [31, 32, 42], "dlrm_hugectr_graph": 31, "dlrm_hugectr": 31, "cuipcopenmemhandle_v2": 31, "gnu": [31, 41], "libcuda": 31, "539": [31, 40], "2950905596": 31, "542": [31, 47], "698": 31, "peer": [31, 40, 41, 42, 51, 53], "all2al": [31, 40, 41, 42, 51, 53, 55], "699": [31, 41, 47], "700": [31, 40, 47, 51, 53], "705": [31, 47], "782": [31, 47], "max_vocabulary_size_per_gpu_": [31, 41, 42, 51, 53], "3413333": 31, "791": [31, 40, 41, 47], "analysi": [31, 40, 41, 42, 51, 53, 55], "795": [31, 40], "772": [31, 40, 41, 47], "gpu0": [31, 41, 42, 51, 53], "warm": [31, 36, 41, 42, 51, 53, 55], "480": [31, 40, 53], "001000": [31, 41, 42, 51, 53], "522": [31, 40, 47], "72017": 31, "693168": [31, 53], "64947": 31, "694016": 31, "600": [31, 40, 41, 51, 53], "60927": 31, "69323": 31, "432": [31, 47], "60078": 31, "693079": 31, "050": [31, 40], "60162": 31, "693134": 31, "206": [31, 41], "498656": 31, "156138": 31, "rank0": [31, 41, 42, 51, 53], "456": [31, 47, 53], "958": [31, 40, 47], "optimz": [31, 41, 42, 51, 53], "514": [31, 40, 47], "555": [31, 47], "693": 31, "694": 31, "823": [31, 42, 47], "414": [31, 40], "dlrm_hugectr0_sparse_1000": 31, "dlrm_hugectr_dense_1000": 31, "dlrm_hugectr_dens": 31, "graph_config": [31, 41], "convert_embed": [31, 41], "unknown_1": 31, "elif": [31, 32, 40], "unknown_2": 31, "dlrm_hugectr_with_hp": 31, "dlrm_with_hp": 31, "262": [31, 41], "1014": 31, "886": [31, 40], "1239": 31, "cuda_module_load": [31, 32], "env": [31, 32, 33, 53], "onnx2trt_util": [31, 32, 33], "377": [31, 32, 40, 47], "down": [31, 32, 33], "812": [31, 47], "813": 31, "189": 31, "239950": 31, "205": [31, 41], "419": [31, 40], "335": [31, 40], "146": 31, "5763": 31, "1314": 31, "5879": 31, "1368": 31, "kfaster_dynamic_shapes_0805": 31, "preview": [31, 55], "34118830080": 31, "20304": 31, "10752": 31, "scratch": [31, 32, 33, 35, 36, 55], "32505856": 31, "4628": 31, "09284m": 31, "48099840": 31, "6321": 31, "1580": 31, "6322": 31, "1590": 31, "ten": [31, 32, 33], "cmdline": [31, 32, 33], "con": [31, 32, 33], "sorrt": [31, 32, 33], "libtriton_tensorrt": [31, 32, 33], "capab": [31, 32, 33], "iliti": [31, 32, 33], "ectori": [31, 32, 33], "bac": [31, 32, 33], "kend": [31, 32, 33], "shutil": [31, 32, 33, 42, 50], "as_numpi": [31, 32, 33], "49642828": 31, "52846366": 31, "99999994": 31, "9999992": 31, "9999905": 31, "dataload": [32, 47], "dlrm_pytorch": 32, "dlrm_pytorch_spars": 32, "onnx_path": 32, "modified_onnx_path": 32, "dlrm_pytorch_with_hp": 32, "tqdm": [32, 46, 47, 48, 51], "tqdmwarn": 32, "iprogress": 32, "ipywidget": [32, 47], "readthedoc": 32, "en": 32, "stabl": 32, "user_instal": 32, "autonotebook": 32, "notebook_tqdm": 32, "sequenti": [32, 47], "add_modul": 32, "_linear_layer_": 32, "_relu_layer_": 32, "inplac": [32, 47, 51], "transpos": 32, "index_select": 32, "from_pretrain": [32, 48], "bot_mlp": 32, "interaction_lay": 32, "top_mlp": 32, "criterion": 32, "bceloss": 32, "x0_iter": 32, "from_numpi": 32, "pin_memori": 32, "drop_last": 32, "x1_iter": 32, "y_iter": 32, "squeez": [32, 33, 47, 48], "zero_grad": 32, "state_dict": [32, 47], "bottom_linear_layer_1": 32, "in_featur": [32, 47], "out_featur": [32, 47], "bottom_relu_layer_1": 32, "bottom_linear_layer_2": 32, "bottom_relu_layer_2": 32, "bottom_linear_layer_3": 32, "bottom_relu_layer_3": 32, "top_linear_layer_1": 32, "479": [32, 33, 40], "top_relu_layer_1": 32, "top_linear_layer_2": 32, "top_relu_layer_2": 32, "top_linear_layer_3": 32, "top_relu_layer_3": 32, "top_linear_layer_4": 32, "top_relu_layer_4": 32, "top_linear_layer_5": 32, "top_relu_layer_5": 32, "1652954816818237": 32, "7626148462295532": 32, "1845550537109375": 32, "7347715497016907": 32, "0786197185516357": 32, "9271171689033508": 32, "7060756683349609": 32, "7490934133529663": 32, "8274499773979187": 32, "7962949275970459": 32, "6947690844535828": 32, "7241608500480652": 32, "7649394869804382": 32, "7043794393539429": 32, "6948238611221313": 32, "7003152370452881": 32, "7330600619316101": 32, "711887001991272": 32, "6917610168457031": 32, "7227296233177185": 32, "7232402563095093": 32, "7025701999664307": 32, "6962350010871887": 32, "7100769281387329": 32, "7159318923950195": 32, "6963521242141724": 32, "7058508396148682": 32, "7144895792007446": 32, "7082542181015015": 32, "6955724954605103": 32, "6997341513633728": 32, "7167338132858276": 32, "6962475776672363": 32, "6955674290657043": 32, "7098587155342102": 32, "6992183327674866": 32, "6928209066390991": 32, "6933107972145081": 32, "697549045085907": 32, "6969214677810669": 32, "6935250163078308": 32, "6948344111442566": 32, "7015650868415833": 32, "6928752660751343": 32, "6936203837394714": 32, "6962599158287048": 32, "6941655278205872": 32, "6939643025398254": 32, "6933950185775757": 32, "6970551013946533": 32, "0014": 32, "9997": 32, "9991": 32, "0004": 32, "0005": 32, "0002": 32, "dummy_kei": 32, "dummy_numerical_featur": 32, "randn": 32, "input_nam": 32, "output_nam": [32, 41], "dynamic_ax": 32, "ipykernel_52545": 32, "1281679600": 32, "tracerwarn": 32, "incorrect": 32, "stride": [32, 47], "requires_grad": 32, "gather_output_0": 32, "onnx_nam": 32, "gemm_output_0": 32, "gemm": [32, 55], "transb": 32, "114": [32, 40, 47, 54], "relu_output_0": 32, "1455": 32, "constant_output_0": 32, "cpulongtyp": 32, "reshape_output_0": 32, "allowzero": 32, "concat_output_0": 32, "3456": 32, "transpose_output_0": 32, "perm": 32, "matmul_output_0": 32, "729": [32, 47], "gather_33": 32, "351": [32, 33, 40], "concat_1_output_0": 32, "268": 32, "1035": 32, "497": 32, "1259": 32, "543": [32, 47], "652": [32, 40], "653": [32, 40, 47, 53], "209": [32, 47], "220": 32, "280": [32, 41], "433": 32, "331": [32, 47, 53], "144": [32, 33, 47], "5771": 32, "933": [32, 40], "115": [32, 40, 47], "5886": 32, "987": [32, 53], "34103362048": 32, "45142016": 32, "011619m": 32, "58774016": 32, "5933": 32, "1043": 32, "5128022": 32, "51312006": 32, "51246136": 32, "5129204": 32, "51302147": 32, "513144": 32, "dlrm_tf": 33, "dlrm_tf_spars": 33, "032517": 33, "963734": 33, "1638": 33, "30974": 33, "171392": 33, "2197505": 33, "897": [33, 47], "578464": 33, "executor": 33, "1209": 33, "abort": 33, "invalid_argu": 33, "_2": 33, "51200": 33, "892396": 33, "xla": 33, "169": [33, 42, 47], "0x55e0fdfeb330": 33, "892450": 33, "streamexecutor": 33, "897903": 33, "mlir": 33, "dump_mlir_util": 33, "269": [33, 47], "crash": [33, 55], "mlir_crash_reproducer_directori": 33, "379151": 33, "stream_executor": 33, "cuda_dnn": 33, "424": [33, 40], "8902": 33, "502058": 33, "device_compil": 33, "lifetim": [33, 55], "_baseoptim": 33, "_update_step_xla": 33, "0x7fa9660adab0": 33, "reduce_retrac": 33, "68028259277344": 33, "2571352064": 33, "639234": 33, "4132346": 33, "20792958": 33, "5957": 33, "8994140625": 33, "231005": 33, "96875": 33, "185315": 33, "3125": 33, "151740": 33, "43695": 33, "6640625": 33, "45556": 33, "24609375": 33, "131654": 33, "78125": 33, "8805829286575317": 33, "49121": 33, "47265625": 33, "60609": 33, "62109375": 33, "676294": 33, "375": [33, 40, 47], "31208": 33, "66015625": 33, "156789": 33, "65625": 33, "103213": 33, "1015625": 33, "394046783447266": 33, "10789": 33, "5703125": 33, "2716": 33, "05859375": 33, "139559": 33, "130419": 33, "13583": 33, "6923828125": 33, "7378": 33, "22802734375": 33, "81185": 33, "40625": 33, "18370": 33, "3314": 33, "90478515625": 33, "15871": 33, "3154296875": 33, "545": [33, 40, 47], "2841796875": 33, "1281": 33, "3038330078125": 33, "52890": 33, "2550": 33, "232177734375": 33, "4526": 33, "03759765625": 33, "5832462310791": 33, "22301483154297": 33, "7525691986084": 33, "034607887268066": 33, "6510401964187622": 33, "275766372680664": 33, "707094430923462": 33, "7623991966247559": 33, "5783321857452393": 33, "8166252374649048": 33, "885994553565979": 33, "912842869758606": 33, "7323049902915955": 33, "7469371557235718": 33, "8475004434585571": 33, "serializ": 33, "get_config": 33, "proper": 33, "248789": 33, "721088": 33, "126": 33, "926": [33, 47], "868": [33, 40, 41, 47], "302": [33, 41, 47, 55], "255": [33, 41, 47, 53], "04": [33, 42, 44, 45, 47, 50, 51, 53], "unsqueez": [33, 47], "dlrm_tf_with_hp": 33, "2013": 33, "4018": 33, "721": 33, "421": [33, 40], "4516": 33, "793": [33, 40, 47], "374": 33, "774": [33, 47], "fp8_quant": [33, 55], "775": 33, "860": [33, 40, 47], "863": 33, "864": 33, "869": [33, 40, 42, 47], "902": [33, 42], "947": [33, 40, 41], "51968": 33, "047": [33, 40], "069": [33, 40, 42], "077": 33, "034216": 33, "8710": 33, "1051": 33, "8711": 33, "18350080": 33, "007954m": 33, "31981568": 33, "8764": 33, "1091": 33, "1101": 33, "00mdlrm_tf_with_hp": 33, "00mconfig": 33, "tritonbackend_modelinstanceiniti": 33, "dlrm_tf_with_hps_0": 33, "34091672": 33, "demo_for_pytorch_trained_model": 34, "demo_for_hugectr_trained_model": 34, "instal": [34, 35, 41, 43, 46, 47, 48, 49, 50, 53, 55], "benchmark_tf_trained_large_model": 34, "147gb": [34, 55], "interconnect": 34, "bz": 34, "2tb": 34, "gen4": 34, "1396": [34, 41], "sxm5": 34, "platinum": 34, "8480c": 34, "gen5": 34, "773": [34, 40, 41, 47], "nvl": 34, "94gb": 34, "grace": [34, 55], "480gb": 34, "c2c": 34, "grate": 35, "interest": 35, "submit": [35, 54], "bug": [35, 55], "review": [35, 44], "think": 35, "priorit": 35, "comment": [35, 55], "propos": 35, "ahead": [35, 55], "pend": [35, 55], "forget": 35, "properli": [35, 41, 55], "ask": 35, "approv": 35, "clarif": [35, 55], "hesit": 35, "promptli": 35, "contributor": [35, 38, 55], "journei": 35, "1007": 35, "56a762eae3f8": 35, "dst_imag": 35, "docker_fil": 35, "rmm_ver": 35, "vnightli": 35, "cudf_ver": 35, "nvtab_ver": 35, "hugectr_dev_mod": 35, "cli": [35, 41], "varnam": 35, "quiet": 35, "suppress": [35, 55], "devel": 35, "cmake_build_typ": 35, "eval_batch": [35, 55], "enable_multinod": [35, 43], "enable_infer": 35, "enable_hdf": 35, "enable_s3": [35, 53], "amazon": [35, 55], "sdk": [35, 53], "skk": 35, "AND": 35, "denable_hdf": [35, 36], "denable_s3": [35, 53], "denable_multinod": [35, 43], "cmake_install_prefix": [35, 43, 55], "dcmake_install_prefix": [35, 43], "devel_infer": 35, "full": [36, 40, 46, 55], "varieti": 36, "8xa100": 36, "localizedslotembeddinghash": 36, "aren": 36, "distributedslotembeddinghash": 36, "localizedslotembeddingonehot": 36, "gender": 36, "wouldn": 36, "easi": [36, 55], "openmpi": 36, "gpudirect": 36, "dcn_2node_8gpu": 36, "footprint": 36, "tensorcor": 36, "mixed_precis": 36, "arithmet": 36, "underflow": 36, "exchang": [36, 54], "onnx_convert": [36, 41, 55], "hugectr2onnx_demo": 36, "ofembed": 36, "thing": 36, "redund": 36, "novelgpu": 36, "forintegr": 36, "hugectr_wdl_predict": 36, "hierrach": 36, "difficult": 36, "confer": 37, "websit": [37, 39], "titl": [37, 45], "date": 37, "speaker": 37, "video": [37, 44], "episod": 37, "\u52a0\u901f\u7684\u63a8\u8350\u7cfb\u7edf\u6846\u67b6": 37, "joei": 37, "wang": 37, "\u4e2d\u6587": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u5982\u4f55\u52a0\u901f\u63a8\u7406": 37, "\u4f7f\u7528": 37, "\u52a0\u901f": 37, "\u8bad\u7ec3": 37, "gem": 37, "guo": 37, "gtc": 37, "sping": 37, "march": 37, "matthia": [37, 43], "langer": [37, 43], "yingcan": [37, 43], "wei": [37, 43], "yu": 37, "fan": [37, 40], "english": 37, "apsara": 37, "\u63a8\u8350\u7cfb\u7edf": 37, "oct": 37, "spring": 37, "tencent": 37, "advertis": [37, 55], "april": 37, "xiangt": 37, "kong": 37, "Into": 37, "minseok": 37, "lee": 37, "jianb": 37, "dong": 37, "china": 37, "2020": [37, 53], "\u6df1\u5165\u7814\u7a76\u6027\u80fd\u4f18\u5316": 37, "\u6027\u80fd\u63d0\u5347": 37, "\u500d": 37, "\u7684\u9ad8\u6027\u80fd": 37, "\u5e7f\u544a\u63a8\u8350\u52a0\u901f\u7cfb\u7edf\u7684\u843d\u5730\u5b9e\u73b0": 37, "\u63a8\u7406\u8fc7\u7a0b": 37, "\u5c06": 37, "\u96c6\u6210\u4e8e": 37, "estim": [37, 38, 39, 55, 56], "2019": 37, "\u52a0\u901f\u7684\u63a8\u8350\u7cfb\u7edf\u8bad\u7ec3": 37, "wechat": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e09": 37, "\u96c6\u6210\u5230tensorflow": 37, "nov": 37, "devblog": 37, "\u5206\u5c42\u53c2\u6570\u670d\u52a1\u5668\u6269\u5c55\u63a8\u8350\u7cfb\u7edf\u63a8\u7406": 37, "august": 37, "shashank": 37, "verma": 37, "wenwen": 37, "gao": 37, "jerri": [37, 43], "shi": [37, 43], "kit": [37, 43, 55], "\u7cfb\u5217\u4e4b\u4e8c": 37, "june": 37, "kunlun": 37, "li": 37, "\u7cfb\u5217\u4e4b\u4e00": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e8c": 37, "\u5206\u7ea7\u53c2\u6570\u670d\u52a1\u5668\u7cfb\u5217\u4e4b\u4e00": 37, "jan": 37, "sept": 37, "vinh": [37, 43], "nguyen": [37, 43], "ann": 37, "spencer": 37, "meituan": 37, "interview": 37, "jun": [37, 40], "huang": 37, "sheng": 37, "luo": 37, "benedikt": 37, "schiffer": 37, "\u6269\u5c55\u548c\u52a0\u901f\u5927\u578b\u6df1\u5ea6\u5b66\u4e60\u63a8\u8350\u7cfb\u7edf": 37, "\u7cfb\u5217\u7b2c": 37, "\u90e8\u5206": 37, "\u7684": 37, "\u8bad\u7ec3\u5927\u578b\u6df1\u5ea6\u5b66\u4e60\u63a8\u8350\u6a21\u578b": 37, "ashish": 37, "sardana": 37, "ir": 37, "aug": 37, "oldridg": 37, "juli": 37, "massiv": [38, 55], "bottleneck": [38, 47], "record": [38, 42, 55], "homogen": 38, "easier": [38, 55], "sign": 38, "advanc": 38, "p100": 38, "pascal": 38, "team": [38, 55], "research": 38, "dcn_norm_generate_train": 38, "wdl_norm_generate_train": 38, "dlrm_raw_generate_train": 38, "dcn_parquet_generate_train": 38, "criteo_data": [38, 40], "panda": [38, 40, 41, 45, 46, 49, 51, 55], "introduct": [39, 55], "overarch": 39, "bring": 39, "cell": [40, 41, 43], "shell": 40, "softlink": 40, "kaggl": [40, 55], "occurr": 40, "postfix": [40, 50], "day_1": 40, "wdl_data": 40, "3rd": 40, "4th": 40, "embodi": 40, "5th": 40, "6th": 40, "soft": [40, 42], "project_root": 40, "home": 40, "wget": [40, 41, 42, 46], "cail": [40, 42], "day_0": [40, 42], "gz": [40, 41, 42], "deepfm_data_nvt": 40, "nvt": [40, 42, 50, 51], "ln": [40, 41, 42], "smi": 40, "460": [40, 47], "disp": 40, "uncorr": 40, "ecc": 40, "temp": [40, 42], "perf": [40, 55], "pwr": 40, "mig": 40, "00000000": 40, "33c": 40, "p0": 40, "42w": 40, "300w": 40, "0mib": 40, "16160mib": 40, "35c": 40, "45w": 40, "36c": 40, "44w": 40, "8a": [40, 41], "34c": 40, "41w": 40, "gi": 40, "ci": 40, "pid": 40, "dlrm_train": [40, 55], "use_dynamic_hash_t": 40, "shard_plan": 40, "round_robin": 40, "store_tru": 40, "generate_shard_plan": 40, "target_gpu": 40, "gpu_id": 40, "mp_tabl": 40, "6000": [40, 42], "dp_tabl": 40, "use_embedding_collect": 40, "num_embed": 40, "ebc": 40, "emb_vec_list": 40, "emb_vec": 40, "relu3": [40, 53], "relu4": [40, 53], "fc5": [40, 53], "relu5": [40, 53], "fc6": [40, 53], "relu6": [40, 53], "fc7": [40, 53], "relu7": [40, 53], "fc8": [40, 53], "3508545476": 40, "637": 40, "4714": 40, "4441": 40, "609": [40, 53], "5378": 40, "5339": 40, "4636": 40, "4480": 40, "4949": 40, "5183": 40, "789": [40, 53], "790": 40, "792": [40, 41], "919": [40, 42], "max_row_group_s": [40, 41, 42], "133678": 40, "022": 40, "134102": 40, "029": 40, "0804": 40, "0457": 40, "030": 40, "0183": 40, "032": 40, "1121": 40, "033": 40, "035": 40, "0378": 40, "0222": 40, "038": 40, "0691": 40, "039": 40, "0925": 40, "9636": 40, "043": 40, "9363": 40, "044": 40, "0300": 40, "0261": 40, "9558": 40, "049": 40, "9402": 40, "9871": 40, "052": 40, "0105": 40, "6863": 40, "224": [40, 47], "6589": 40, "330": 40, "7527": 40, "474": 40, "7488": 40, "6785": 40, "646": 40, "6628": 40, "755": [40, 53], "7097": 40, "7332": 40, "040": 40, "4089": 40, "175": [40, 47], "3816": 40, "4753": 40, "467": [40, 47, 53], "617": [40, 47, 54], "4011": 40, "3855": 40, "921": 40, "4324": 40, "063": [40, 42], "4558": 40, "221": 40, "1016": 40, "7546": 40, "7253": 40, "410": [40, 47, 53], "8425": 40, "412": [40, 42, 53], "8308": 40, "413": [40, 41, 42, 47, 53], "7957": 40, "9031": 40, "415": [40, 53], "9578": 40, "417": 40, "6531": 40, "418": 40, "6238": 40, "420": [40, 47], "8386": 40, "7410": 40, "422": 40, "7292": 40, "6941": 40, "425": [40, 42], "8015": 40, "426": 40, "8562": 40, "558": [40, 47], "4051": 40, "1921": 40, "567": [40, 41], "1628": 40, "570": [40, 47], "3777": 40, "573": 40, "2800": [40, 51], "576": 40, "2683": 40, "579": 40, "2332": 40, "582": 40, "3406": 40, "585": 40, "3953": 40, "587": [40, 47], "0088": [40, 41], "1824": 40, "1531": 40, "589": [40, 41], "3679": 40, "590": [40, 47], "2703": 40, "591": 40, "2585": 40, "592": 40, "2234": 40, "593": 40, "3308": 40, "595": [40, 47], "457": 40, "data0": 40, "data3": 40, "data4": 40, "data5": 40, "data6": 40, "data7": 40, "data8": 40, "data9": 40, "data10": 40, "data11": 40, "data12": 40, "data13": 40, "data14": 40, "data15": 40, "data16": 40, "data17": 40, "data18": 40, "data19": 40, "data20": 40, "data21": 40, "data22": 40, "data23": 40, "data24": 40, "data25": 40, "embeddingcollection0": 40, "emb_vec0": 40, "emb_vec1": 40, "emb_vec2": 40, "emb_vec3": 40, "emb_vec4": 40, "emb_vec5": 40, "emb_vec6": 40, "emb_vec7": 40, "emb_vec8": 40, "emb_vec9": 40, "emb_vec10": 40, "emb_vec11": 40, "emb_vec12": 40, "emb_vec13": 40, "emb_vec14": 40, "emb_vec15": 40, "emb_vec16": 40, "emb_vec17": 40, "emb_vec18": 40, "emb_vec19": 40, "emb_vec20": 40, "emb_vec21": 40, "emb_vec22": 40, "emb_vec23": 40, "emb_vec24": 40, "emb_vec25": 40, "500000": [40, 41], "458": 40, "14373": 40, "24478": 40, "697": [40, 47], "23782": 40, "142604": 40, "168333": 40, "865": 40, "142137": 40, "25698": 40, "19912": 40, "142685": 40, "1404": 40, "24589": 40, "18021": 40, "143021": 40, "211": [40, 42], "139695": 40, "25073": 40, "245": 40, "16407": 40, "141111": 40, "13893": 40, "24958": 40, "17112": 40, "141069": 40, "138218": 40, "25123": 40, "18422": 40, "135439": 40, "759": 40, "137244": 40, "25471": 40, "803": [40, 53], "19334": 40, "139792": 40, "136812": 40, "2416": 40, "17574": 40, "140519": 40, "135968": 40, "25386": 40, "18238": 40, "134846": 40, "291": [40, 55], "134873": 40, "23619": 40, "3445591887": 40, "383": 40, "384": [40, 47], "385": [40, 42, 47], "386": 40, "628": 40, "643": [40, 41, 47], "651": [40, 47], "654": 40, "939": [40, 41], "946": [40, 41, 47], "997": 40, "0258": 40, "0417": 40, "0144": 40, "011": [40, 41, 42, 53], "1042": 40, "015": 40, "0339": 40, "020": 40, "024": [40, 41], "0652": 40, "0886": [40, 41], "071": 40, "075": [40, 42], "9285": 40, "084": 40, "9480": 40, "092": [40, 41], "9324": 40, "9792": [40, 42], "101": 40, "0027": 40, "332": [40, 55], "9753": 40, "746": 40, "748": [40, 47], "749": 40, "9675": 40, "752": 40, "9519": 40, "9988": 40, "757": 40, "8738": 40, "8464": 40, "760": 40, "762": [40, 47, 53], "763": 40, "8660": 40, "765": [40, 47], "8503": 40, "767": 40, "8972": 40, "9207": 40, "911": 40, "917": 40, "4128": 40, "924": 40, "4792": 40, "930": 40, "4050": 40, "3894": 40, "937": [40, 41, 47], "4363": 40, "940": [40, 41], "4597": 40, "941": [40, 41], "4031": 40, "942": [40, 47], "3757": 40, "944": [40, 47], "4695": 40, "945": [40, 47], "4656": 40, "3796": 40, "948": [40, 47], "4265": 40, "950": [40, 47], "4500": [40, 51], "841": [40, 47], "842": [40, 47], "251": [40, 53], "143524": 40, "34586": 40, "345": [40, 47], "48449": 40, "142247": 40, "657": 40, "141641": 40, "33134": 40, "40384": 40, "142243": 40, "139913": 40, "33118": 40, "161": 40, "40793": 40, "142713": 40, "138901": 40, "34956": 40, "40618": 40, "140238": 40, "883": 40, "138208": 40, "34071": 40, "38745": 40, "140117": 40, "326": 40, "137638": 40, "34076": 40, "42352": 40, "135055": 40, "727": [40, 47, 53], "137268": 40, "728": 40, "33588": 40, "819": [40, 53], "38619": 40, "139783": 40, "193": 40, "136816": 40, "3762": 40, "43341": 40, "140772": 40, "581": [40, 47], "136368": 40, "3521": 40, "673": 40, "41807": 40, "135264": 40, "985": 40, "135726": 40, "34242": 40, "198655838": 40, "517": 40, "730": [40, 47], "731": 40, "732": 40, "896": 40, "907": 40, "913": [40, 47], "914": 40, "915": [40, 47], "969": 40, "002": 40, "004": 40, "005": [40, 53], "007": [40, 53], "008": [40, 53], "012": 40, "013": 40, "014": 40, "017": 40, "021": 40, "023": 40, "025": 40, "081": 40, "121": [40, 41], "423": [40, 41, 47], "505": [40, 53], "145": 40, "559": [40, 42, 47], "747": [40, 47], "275": 40, "091": [40, 42], "133": [40, 42], "361": [40, 42, 53], "0203": 40, "364": [40, 42, 55], "365": [40, 41, 42, 53], "0515": 40, "367": 40, "9460": 40, "0046": 40, "9890": 40, "371": [40, 47], "1355": 40, "372": 40, "8269": 40, "373": [40, 47], "9187": 40, "376": 40, "9500": 40, "8445": 40, "8875": 40, "3660": 40, "525": [40, 47], "4578": 40, "528": 40, "531": [40, 53], "4890": 40, "3835": 40, "538": 40, "4421": 40, "544": [40, 42, 47], "5730": 40, "3562": 40, "546": [40, 47], "548": [40, 47], "550": [40, 47], "3738": 40, "552": [40, 47], "4167": 40, "5632": 40, "594": 40, "599": 40, "144991": 40, "22035": 40, "633": [40, 47], "03885": 40, "144124": 40, "144851": 40, "1863": 40, "98102": 40, "145444": 40, "540": 40, "141821": 40, "18638": 40, "96441": 40, "144249": 40, "139519": 40, "18203": 40, "556": [40, 41, 47], "97548": 40, "140895": 40, "490": 40, "13942": 40, "491": 40, "19363": 40, "533": 40, "97628": 40, "141202": 40, "465": [40, 47], "13947": 40, "18342": 40, "97817": 40, "136504": 40, "138534": 40, "19586": 40, "96355": 40, "14067": 40, "138213": 40, "20188": 40, "98811": 40, "142139": 40, "138044": 40, "19324": 40, "427": [40, 47, 50], "96149": 40, "136835": 40, "137419": 40, "18732": 40, "grow": [40, 55], "1217153067": 40, "506": 40, "485": [40, 41, 47], "486": 40, "662": 40, "669": 40, "670": 40, "671": [40, 42, 47], "672": [40, 47], "862": [40, 49], "866": [40, 47], "871": 40, "872": [40, 53], "873": [40, 41, 42], "875": [40, 53], "876": 40, "878": 40, "881": 40, "882": 40, "884": [40, 47], "949": 40, "055": 40, "157": [40, 47], "780": [40, 53], "953": [40, 47], "150": [40, 41, 53], "434": [40, 47], "786": 40, "8152": 40, "787": 40, "7878": 40, "9441": 40, "8699": 40, "8542": 40, "9011": 40, "9246": 40, "797": 40, "7136": 40, "798": 40, "802": [40, 47], "7683": 40, "805": [40, 47], "7996": 40, "806": [40, 47], "8230": 40, "2527": 40, "943": [40, 47], "2253": 40, "3074": 40, "955": [40, 47], "2917": 40, "3386": 40, "961": 40, "3621": 40, "962": [40, 41], "2429": 40, "964": 40, "2156": 40, "965": 40, "3718": 40, "966": [40, 47], "967": [40, 42, 47], "2976": 40, "968": 40, "2820": 40, "3289": 40, "970": 40, "3523": [40, 42], "859": 40, "static_map": 40, "553648128": 40, "142151": 40, "53912": 40, "26107": 40, "141023": 40, "141078": 40, "57008": 40, "10267": 40, "141925": 40, "309": [40, 47, 53], "140561": 40, "55499": 40, "362": [40, 42, 47, 55], "13614": 40, "14338": 40, "139972": 40, "54929": 40, "464": 40, "10246": 40, "141379": 40, "139553": 40, "56729": 40, "11698": 40, "141421": 40, "642": [40, 41], "139362": 40, "56153": 40, "696": 40, "11376": 40, "136499": 40, "138972": 40, "60721": 40, "811": 40, "11548": 40, "141355": 40, "138726": 40, "56329": 40, "10124": 40, "142614": 40, "139617": 40, "5483": 40, "14957": 40, "138442": 40, "138159": 40, "57499": 40, "ensembl": [41, 43, 55], "inferenceon": 41, "739": 41, "638": 41, "715": 41, "986": 41, "142": 41, "218": 41, "hps_demo": [41, 43], "reshape2": [41, 42, 51], "1100": [41, 51, 53], "ground_truth": 41, "2598678435": 41, "565": 41, "566": 41, "636": 41, "808": 41, "810": 41, "21845": 41, "0047": 41, "6921": 41, "0092": 41, "6824": 41, "207": [41, 47], "208": 41, "213": 41, "658": [41, 47], "444961": 41, "693355": 41, "508793": 41, "694358": 41, "422282": 41, "695494": 41, "764": 41, "175263": 41, "691037": 41, "174492": 41, "688767": 41, "503806": 41, "000913": 41, "093": [41, 42], "148": 41, "279": 41, "hps_demo_with_embed": 41, "hps_demo_dense_1000": 41, "sparse_model": [41, 55], "hps_demo0_sparse_1000": 41, "hps_demo1_sparse_1000": 41, "hps_demo_without_embed": 41, "parameterserverconfig": 41, "pd": [41, 45, 46, 49, 51], "onnxruntim": 41, "ort": 41, "key_offset": 41, "cumsum": 41, "ps_config": 41, "emb_table_nam": 41, "max_feature_num_per_sample_per_emb_t": 41, "inference_params_arrai": 41, "df": [41, 50, 53], "read_parquet": [41, 50, 51], "dense_input_column": 41, "cat_input1_column": 41, "cat_input2_column": 41, "loc": [41, 51], "to_numpi": 41, "cat_input1": 41, "cat_input2": 41, "embedding1": 41, "flatten": 41, "embedding2": 41, "get_output": 41, "input_fe": 41, "get_input": 41, "sess_ref": 41, "res_ref": 41, "pred_ref": 41, "diff_ref": 41, "mse_ref": 41, "18488": 41, "18470": 41, "4895492": 41, "509022": 41, "38192913": 41, "5264926": 41, "50650454": 41, "47927693": 41, "48954916": 41, "50902206": 41, "38192907": 41, "52649266": 41, "5065045": 41, "4792769": 41, "3887142e": 41, "566238532": 41, "3543": 41, "cleanunusedinitializersandnodearg": 41, "key_to_indice_hash_all_t": 41, "lookup_fromdlpack": [41, 55], "capsul": [41, 55], "to_dlpack": 41, "key_capsul": 41, "out_capsul": 41, "out_put": 41, "from_dlpack": 41, "runtimeerror": 41, "cuda_devic": 41, "is_avail": [41, 42], "10028": 41, "10004": 41, "0307": 41, "0264": 41, "0294": 41, "0151": 41, "0281": 41, "eager": 41, "out_tensor": 41, "out_dlcapsul": 41, "729218": 41, "182": [41, 42], "168630": 41, "1639": 41, "30048": 41, "170043": 41, "30184": 41, "171618": 41, "173095": 41, "174795": 41, "176299": 41, "177782": 41, "179411": 41, "20005": 41, "30047": 41, "20004": 41, "30001": 41, "20037": 41, "02182689": 41, "01806355": 41, "01985828": 41, "0136845": 41, "01738386": 41, "00323257": 41, "unix": 41, "primari": [41, 55], "secondari": 41, "multi_process_hp": 41, "multiprocess": [41, 46], "create_hp": 41, "num_max_process": 41, "subprocess": [41, 46], "getpid": 41, "await": 41, "sleep": 41, "eras": 41, "lost": 41, "delet": [41, 55], "revok": 41, "preserv": 41, "risidu": 41, "monitor": 41, "counter": 41, "destroi": 41, "far": 41, "1394": 41, "1397": 41, "270453215232": 41, "269706559488": 41, "17179868672": 41, "313": 41, "multiprocesshashmapbackend": [41, 55], "289": [41, 47, 53], "311": [41, 53], "281": 41, "282": 41, "260310085632": 41, "7783505728": 41, "463": [41, 47], "706": 41, "711": [41, 53], "842594773": 41, "3887142264200634e": 41, "497305659": 41, "101124718": 41, "176": [41, 42], "687": 41, "detach": [41, 47, 48], "progress": [41, 55], "mock": 41, "tar": [41, 47], "archiv": [41, 50], "rf": 41, "xf": 41, "sf": 41, "112": [41, 47], "443": 41, "sent": 41, "codeload": 41, "ref": 41, "gzip": [41, 42], "87m": 41, "50mb": 41, "3011655": 41, "tmr": 41, "mkreleasehdr": 41, "broken": [41, 55], "pipe": 41, "34mcc": 41, "33mmakefil": 41, "dep": 41, "sentinel": 41, "gcda": 41, "gcno": 41, "gcov": 41, "lcov": 41, "makefil": 41, "adlist": 41, "quicklist": 41, "ae": 41, "anet": 41, "sd": 41, "zmalloc": 41, "lzf_c": 41, "lzf_d": 41, "pqsort": 41, "zipmap": 41, "sha1": 41, "ziplist": 41, "replic": 41, "t_string": 41, "t_list": 41, "t_set": 41, "t_zset": 41, "t_hash": 41, "pubsub": 41, "intset": 41, "syncio": 41, "crc16": 41, "endianconv": 41, "slowlog": 41, "bio": 41, "rio": 41, "rand": [41, 49], "memtest": 41, "syscheck": 41, "crcspeed": 41, "crc64": 41, "bitop": 41, "notifi": 41, "setproctitl": 41, "hyperloglog": 41, "sparklin": 41, "geo": 41, "lazyfre": 41, "expir": 41, "geohash": 41, "geohash_help": 41, "childinfo": 41, "defrag": 41, "siphash": 41, "rax": 41, "t_stream": 41, "listpack": 41, "localtim": 41, "lolwut": 41, "lolwut5": 41, "lolwut6": 41, "acl": 41, "sha256": 41, "timeout": 41, "setcpuaffin": 41, "monoton": 41, "mt19937": 41, "resp_pars": 41, "call_repli": 41, "script_lua": 41, "function_lua": 41, "redisassert": 41, "cli_common": 41, "distclean": 41, "clean": [41, 42, 50, 55], "linenois": 41, "lua": 41, "jemalloc": 41, "hdr_histogram": 41, "leav": 41, "xo": 41, "commandfilt": 41, "testrdb": 41, "infotest": 41, "misc": 41, "hook": 41, "blockonkei": 41, "blockonbackground": 41, "scan": 41, "datatype2": 41, "auth": 41, "keyspace_ev": 41, "blockedcli": 41, "getkei": 41, "getchannel": 41, "test_lazyfre": 41, "defragtest": 41, "keyspec": 41, "zset": 41, "mallocs": 41, "aclcheck": 41, "subcommand": 41, "repli": 41, "cmdintrospect": 41, "eventloop": 41, "moduleconfig": 41, "moduleconfigstwo": 41, "usercal": 41, "pedant": 41, "dredis_stat": 41, "c11": [41, 53], "wall": [41, 50], "wno": 41, "o2": 41, "malloc": 41, "build_tl": 41, "use_systemd": 41, "cflag": 41, "ldflag": 41, "redis_cflag": 41, "redis_ldflag": 41, "prev_final_cflag": 41, "ggdb": 41, "duse_jemalloc": 41, "prev_final_ldflag": 41, "rdynam": 41, "1mmake": 41, "1mhiredi": 41, "c99": 41, "o3": 41, "fpic": 41, "wstrict": 41, "prototyp": 41, "wwrite": 41, "net": [41, 47, 48, 50], "sockcompat": 41, "rc": 41, "libhiredi": 41, "1mlinenois": 41, "1mlua": 41, "dlua_ansi": 41, "denable_cjson_glob": 41, "dlua_use_mkstemp": 41, "myldflag": 41, "lapi": 41, "lcode": 41, "ldebug": 41, "ldo": 41, "ldump": 41, "lfunc": 41, "lgc": 41, "llex": 41, "lmem": 41, "lobject": 41, "lopcod": 41, "lparser": 41, "lstate": 41, "lstring": 41, "ltabl": 41, "ltm": 41, "lundump": 41, "lvm": 41, "lzio": 41, "strbuf": 41, "fpconv": 41, "lauxlib": 41, "lbaselib": 41, "ldblib": 41, "liolib": 41, "lmathlib": 41, "loslib": 41, "ltablib": 41, "lstrlib": 41, "loadlib": 41, "linit": 41, "lua_cjson": 41, "lua_struct": 41, "lua_cmsgpack": 41, "lua_bit": 41, "liblua": 41, "dll": 41, "ranlib": 41, "lm": 41, "luac": 41, "1mhdr_histogram": 41, "dhdr_malloc_includ": 41, "hdr_redis_malloc": 41, "libhdrhistogram": 41, "1mjemalloc": 41, "g0": 41, "lg": 41, "quantum": 41, "je_": 41, "gnu99": 41, "g3": 41, "funrol": 41, "xsltproc": 41, "gcc": 41, "iso": 41, "c89": 41, "crai": 41, "gnu11": 41, "wextra": 41, "wshorten": 41, "wsign": 41, "wundef": 41, "preprocessor": 41, "libstdc": 41, "linkag": 41, "grep": 41, "egrep": 41, "ansi": 41, "stat": 41, "stdlib": 41, "inttyp": 41, "stdint": 41, "unistd": 41, "bigendian": 41, "void": 41, "intmax_t": 41, "pc": 41, "paus": 41, "nm": 41, "gawk": 41, "mawk": 41, "usabl": [41, 55], "presenc": 41, "malloc_usable_s": 41, "__attribute__": 41, "syntax": 41, "fvisibl": 41, "hidden": [41, 48], "werror": 41, "herror_on_warn": 41, "tls_model": 41, "alloc_s": 41, "gnu_printf": 41, "printf": 41, "bsd": 41, "ld": 41, "autoconf": 41, "memalign": 41, "valloc": 41, "backtrac": 41, "sbrk": 41, "utrac": 41, "__builtin_unreach": 41, "__builtin_ffsl": 41, "__builtin_popcountl": 41, "lg_page": 41, "pthread": 41, "pthread_creat": 41, "lpthread": 41, "dlfcn": 41, "dlsym": 41, "pthread_atfork": 41, "pthread_setname_np": 41, "clock_gettim": 41, "clock_monotonic_coars": 41, "clock_monoton": 41, "mach_absolute_tim": 41, "syscal": 41, "secure_getenv": 41, "sched_getcpu": 41, "sched_setaffin": 41, "issetugid": 41, "_malloc_thread_cleanup": 41, "_pthread_mutex_init_calloc_cb": 41, "__atom": 41, "__sync": 41, "darwin": 41, "osatom": 41, "madvis": 41, "madv_fre": 41, "madv_dontne": 41, "madv_do": 41, "nt": 41, "madv_": 41, "__builtin_clz": 41, "os_unfair_lock_": 41, "glibc": 41, "mutex": 41, "d_gnu_sourc": 41, "strerror_r": 41, "stdbool": 41, "conform": 41, "_bool": 41, "xsl": 41, "manpag": 41, "xml": 41, "jemalloc_macro": 41, "jemalloc_proto": 41, "jemalloc_typedef": 41, "jemalloc_preambl": 41, "jemalloc_test": 41, "stamp": 41, "jeprof": 41, "jemalloc_def": 41, "jemalloc_internal_def": 41, "jemalloc_test_def": 41, "public_symbol": 41, "private_symbol": 41, "awk": 41, "private_symbols_jet": 41, "public_namespac": 41, "public_unnamespac": 41, "jemalloc_protos_jet": 41, "jemalloc_renam": 41, "jemalloc_mangl": 41, "jemalloc_mangle_jet": 41, "revis": [41, 55], "configure_cflag": 41, "specified_cflag": 41, "extra_cflag": 41, "cppflag": 41, "d_reentrant": 41, "cxx": 41, "configure_cxxflag": 41, "specified_cxxflag": 41, "extra_cxxflag": 41, "extra_ldflag": 41, "dso_ldflag": 41, "wl": 41, "sonam": 41, "lstdc": 41, "rpath_extra": 41, "xslroot": 41, "bindir": 41, "datadir": 41, "includedir": 41, "libdir": 41, "mandir": 41, "man": 41, "srcroot": 41, "abs_srcroot": 41, "objroot": 41, "abs_objroot": 41, "jemalloc_prefix": 41, "jemalloc_private_namespac": 41, "install_suffix": 41, "malloc_conf": 41, "autogen": 41, "experimetal_smallocx": 41, "prof": 41, "libunwind": 41, "libgcc": 41, "xmalloc": 41, "lazy_lock": 41, "oblivi": 41, "libjemalloc": 41, "iinclud": 41, "djemalloc_no_private_namespac": 41, "sym": 41, "arena": 41, "background_thread": 41, "bitmap": 41, "ckh": 41, "ctl": 41, "div": 41, "extent": 41, "extent_dss": 41, "extent_mmap": 41, "malloc_io": 41, "mutex_pool": 41, "nstime": 41, "prng": 41, "rtree": 41, "safety_check": 41, "sc": 41, "sz": 41, "tcach": 41, "test_hook": 41, "ticker": 41, "tsd": 41, "wit": 41, "private_namespac": 41, "gen": 41, "cp": 41, "jemalloc_cpp": 41, "cru": 41, "33madlist": 41, "33mquicklist": 41, "33mae": 41, "33manet": 41, "33mdict": 41, "33mserver": 41, "33msd": 41, "33mzmalloc": 41, "33mlzf_c": 41, "33mlzf_d": 41, "33mpqsort": 41, "33mzipmap": 41, "33msha1": 41, "33mziplist": 41, "33mreleas": 41, "33mnetwork": 41, "33mutil": 41, "33mobject": 41, "33mdb": 41, "33mreplic": 41, "33mrdb": 41, "33mt_string": 41, "33mt_list": 41, "33mt_set": 41, "33mt_zset": 41, "33mt_hash": 41, "33mconfig": 41, "33maof": 41, "33mpubsub": 41, "33mmulti": 41, "33mdebug": 41, "33msort": 41, "33mintset": 41, "33msyncio": 41, "33mcluster": 41, "33mcrc16": 41, "33mendianconv": 41, "33mslowlog": 41, "33meval": 41, "33mbio": 41, "33mrio": 41, "33mrand": 41, "33mmemtest": 41, "33msyscheck": 41, "33mcrcspeed": 41, "33mcrc64": 41, "33mbitop": 41, "33msentinel": 41, "33mnotifi": 41, "33msetproctitl": 41, "33mblock": 41, "33mhyperloglog": 41, "33mlatenc": 41, "33msparklin": 41, "33mredi": 41, "33mgeo": 41, "33mlazyfre": 41, "33mmodul": 41, "33mevict": 41, "33mexpir": 41, "33mgeohash": 41, "33mgeohash_help": 41, "33mchildinfo": 41, "33mdefrag": 41, "33msiphash": 41, "33mrax": 41, "33mt_stream": 41, "33mlistpack": 41, "33mlocaltim": 41, "33mlolwut": 41, "33mlolwut5": 41, "33mlolwut6": 41, "33macl": 41, "33mtrack": 41, "33mconnect": 41, "33mtl": 41, "33msha256": 41, "33mtimeout": 41, "33msetcpuaffin": 41, "33mmonoton": 41, "33mmt19937": 41, "33mresp_pars": 41, "33mcall_repli": 41, "33mscript_lua": 41, "33mscript": 41, "33mfunction": 41, "33mfunction_lua": 41, "33mcommand": 41, "1mlink": 41, "1mredi": 41, "1minstal": 41, "33mredisassert": 41, "33mcli_common": 41, "hint": 41, "idea": 41, "conf": 41, "daemon": 41, "appendonli": 41, "7001": 41, "7002": 41, "shutdown": [41, 42, 55], "pkill": 41, "1m": 41, "0mmaster": 41, "5460": 41, "master": 41, "5461": 41, "10922": 41, "10923": 41, "16383": 41, "fa9bb82124685a6438a696cc1562693ccc815ff0": 41, "c6d7ad6353bf568d17a147e65b8198ded9d65717": 41, "5462": 41, "e26ae6cfbeea8a1e6367444445364d963ae17436": 41, "0mwait": 41, "0mm": 41, "coverag": 41, "num_node_connect": 41, "572": [41, 47], "redisclust": 41, "134": [41, 47, 53], "230052244": 41, "setupt": 41, "24mb": 41, "duse_openssl": 41, "use_ssl": 41, "dhiredis_test_ssl": 41, "libhiredis_ssl": 41, "encyrypt": 41, "test_cert": 41, "openssl": 41, "redis_serv": 41, "keyusag": 41, "digitalsignatur": 41, "keyencipher": 41, "hugectr_cli": 41, "nscerttyp": 41, "genrsa": 41, "public": 41, "rsa": 41, "pubout": 41, "dummi": 41, "req": 41, "x509": 41, "subj": 41, "cn": 41, "dai": [41, 42, 54], "cakei": 41, "caseri": 41, "ser": 41, "cacreateseri": 41, "extfil": 41, "subject": 41, "cert": 41, "cacert": 41, "a441806db5506b7600ee8ae794fa01dc31ac83c9": 41, "6fa93392a396aa3c321736234b7eafc86bb1f979": 41, "8e9cd68cc229fcb568a84d7358011201b4246046": 41, "644": [41, 47], "984": 41, "990": 41, "995": 41, "998": 41, "conclud": 41, "022623188": 41, "hugectr_e2": 42, "base_dir": 42, "data_dir": 42, "train_dir": 42, "val_dir": 42, "model_dir": 42, "decom": 42, "unzip": [42, 45], "filterwarn": 42, "simplefilt": 42, "dask_cudf": [42, 50], "dask_cuda": 42, "localcudaclust": 42, "dask": [42, 50], "device_mem_s": 42, "pynvml_mem_s": 42, "categorifi": [42, 50], "fillmiss": 42, "get_embedding_s": [42, 50, 51], "basicconfig": 42, "asctim": 42, "setlevel": 42, "notset": 42, "getlogg": 42, "asyncio": 42, "schema": [42, 50], "categorical_column": [42, 50], "continuous_column": 42, "label_column": [42, 50], "criteo_column": 42, "cross_column": 42, "c1_c2": 42, "c3_c4": 42, "num_integer_column": 42, "num_categorical_column": 42, "num_total_column": 42, "dashboard": 42, "dashboard_port": 42, "8787": 42, "tcp": 42, "visible_devic": 42, "delect": 42, "device_limit_frac": 42, "spill": 42, "device_pool_frac": 42, "part_mem_frac": 42, "device_s": 42, "device_limit": 42, "device_pool_s": 42, "part_siz": [42, 50], "fmem": 42, "1e9": 42, "bewar": 42, "n_worker": 42, "device_memory_limit": 42, "dashboard_address": 42, "rmm_pool_siz": 42, "061": 42, "preload": 42, "062": 42, "072": 42, "087": 42, "acc90f7f": 42, "fb72": 42, "11ed": 42, "808f": 42, "54ab3adac0a5": 42, "c0d46f34": 42, "503": 42, "789d4132": 42, "7d07": 42, "451f": 42, "ac": 42, "1867dfa9d7b3": 42, "comm": 42, "33423": 42, "40925": 42, "43851": 42, "nanni": 42, "40143": 42, "6pb36hck": 42, "40769": 42, "44353": 42, "43979": 42, "rv8itza6": 42, "45255": 42, "37165": 42, "46241": 42, "co2ru8ea": 42, "40555": 42, "37399": 42, "36117": 42, "04qjh_rt": 42, "39951": 42, "42631": 42, "46323": 42, "9zzs6cz6": 42, "40815": 42, "37909": 42, "40533": 42, "hq437puc": 42, "42963": 42, "41947": 42, "42201": 42, "kuwua5fi": 42, "39607": 42, "45371": 42, "39667": 42, "ouyeimq6": 42, "train_output": 42, "val_output": 42, "train_input": 42, "val_input": 42, "preprocess_dir_temp_train": 42, "preprocess_dir_temp_v": 42, "makedir": 42, "preprocess_dir_temp": 42, "cudf": [42, 50, 55], "one_path": 42, "rmtree": [42, 50], "train_valid_path": 42, "temp_output": 42, "ddf": 42, "read_csv": [42, 45, 46, 49], "sep": 42, "feature_pair": 42, "to_parquet": [42, 45, 49, 50], "train_path": [42, 50], "valid_path": [42, 50], "categorify_op": 42, "cat_featur": [42, 50], "cont_featur": 42, "min_valu": 42, "cross_cat_op": 42, "output_format": 42, "train_ds_iter": 42, "valid_ds_iter": 42, "per_partit": [42, 50], "dict_dtyp": [42, 50], "col": [42, 50], "transform": [42, 44, 47, 48, 50], "to_hugectr": 42, "output_path": [42, 50], "embeddings_dict_cat": 42, "embeddings_dict_cross": 42, "ndask": 42, "1234907": 42, "19683": 42, "13780": 42, "6867": 42, "18490": 42, "6264": 42, "1235": 42, "854680": 42, "114026": 42, "75736": 42, "2159": 42, "7533": 42, "1307783": 42, "404742": 42, "1105613": 42, "87714": 42, "9032": 42, "1577645": 42, "1093030": 42, "187256813049316": 42, "data_path": 42, "model_path": 42, "1581605": 42, "4000": [42, 51], "2720": 42, "1350": 42, "wide_redn": 42, "dropout2": 42, "add1": 42, "21000": 42, "mpiinitservic": 42, "4031005480": 42, "353": [42, 47], "355": 42, "475000": 42, "0018": 42, "7234": 42, "366": 42, "7175": 42, "7946054": 42, "6990506": 42, "0788": 42, "3132": 42, "392": 42, "7372800": 42, "396": [42, 47], "3516": 42, "5847": 42, "397": [42, 47], "2162": 42, "0056": 42, "3464": 42, "874": [42, 50], "429": [42, 53], "70458": 42, "124098": 42, "6176": 42, "130088": 42, "835": 42, "3000": [42, 51], "61959": 42, "101731": 42, "449": 42, "61009": 42, "110557": 42, "738497": 42, "47924": 42, "1046": 42, "10236": 42, "61852": 42, "102157": 42, "771": 42, "58452": 42, "123451": 42, "61023": 42, "122763": 42, "867": [42, 47], "698276": 42, "48087": 42, "487": 42, "0999177": 42, "103": [42, 47], "61106": 42, "0999892": 42, "722": 42, "11000": 42, "61545": 42, "0883301": 42, "348": [42, 53], "12000": [42, 55], "62134": 42, "0828304": 42, "688598": 42, "4733": 42, "13000": 42, "0717": 42, "108287": 42, "14000": 42, "62997": 42, "0745141": 42, "15000": 42, "60764": 42, "0720452": 42, "287": [42, 47], "16000": 42, "61101": 42, "0851126": 42, "758": 42, "685426": 42, "47088": 42, "17000": 42, "0865": 42, "0632745": 42, "18000": 42, "62825": 42, "0742994": 42, "626": 42, "19000": 42, "61035": 42, "0679226": 42, "230": 42, "59954": 42, "0779185": 42, "704": 42, "684045": 42, "4736": 42, "733": 42, "119": 42, "398": [42, 47], "611": 42, "903": [42, 47], "788": [42, 47], "5538": 42, "0770708": 42, "But": [43, 55], "development": 43, "repo": 43, "pybind11": 43, "hugectr_e2e_demo_with_nvtabular": 43, "continuous_train": 43, "multi_gpu_offline_infer": 43, "training_and_inference_with_remote_filesystem": 43, "modal": [43, 45, 46, 55], "movi": [43, 44, 45, 50, 52], "movielen": [43, 44, 50, 51, 52, 55], "25m": [43, 44, 46, 49, 52], "xiaolei": 43, "training_with_remote_filesystem": 43, "price": 44, "purchas": 44, "Such": 44, "rich": [44, 46], "poster": [44, 45, 52], "plot": [44, 46, 48], "synopsi": [44, 45, 52], "music": 44, "audio": 44, "lyric": 44, "itinerari": 44, "plan": [44, 55], "attract": 44, "photo": 44, "resnet": [44, 52], "bert": [44, 55], "pretrain": [44, 50], "enrich": [44, 45, 52], "etl": 44, "000": 45, "subsequ": 45, "sklearn": [45, 55], "model_select": 45, "train_test_split": 45, "download_fil": 45, "input_data_dir": [45, 50, 51], "ml": [45, 46, 49], "grouplen": 45, "movieid": [45, 46, 49, 50, 51], "genr": [45, 50], "toi": 45, "stori": 45, "1995": 45, "adventur": 45, "anim": 45, "children": [45, 47], "comedi": 45, "fantasi": 45, "jumanji": 45, "grumpier": 45, "old": [45, 55], "men": 45, "romanc": 45, "exhal": 45, "drama": 45, "father": 45, "bride": 45, "ii": 45, "movies_convert": [45, 50], "timestamp": [45, 55], "1147880044": 45, "1147868817": 45, "1147868828": 45, "665": 45, "1147878820": 45, "1147868510": 45, "simpl": [45, 49, 55], "test_siz": 45, "random_st": 45, "wish": [45, 46], "proce": [45, 46, 49], "sypnopsi": 46, "scrap": 46, "imdbpi": [46, 48], "ipython": [46, 47, 48], "do_shutdown": [46, 47, 48], "meta": 46, "ia": 46, "director": 46, "the_matrix": 46, "get_movi": 46, "0114709": [46, 47, 49], "get_movie_infoset": 46, "imdbid": [46, 49], "nuniqu": 46, "pickl": [46, 47, 48, 49], "cpu_count": 46, "basemanag": 46, "dictproxi": 46, "movies_id": 46, "movies_info": [46, 48], "movie_info": [46, 48], "risk": 46, "num_job": 46, "chunk_siz": 46, "proc": 46, "pkl": [46, 47, 48, 49], "highest_protocol": [46, 47, 48], "collect_large_post": 46, "filelist": [46, 47], "targetlist": 46, "largefilelist": 46, "largetargetlist": 46, "target_path": 46, "poster_smal": [46, 47], "jpg": [46, 47], "poster_larg": 46, "download_task": 46, "cmd": 46, "popen": 46, "wc": 46, "nvidia_resnet50": 47, "checkout": [47, 55], "5d6d417ff57e8824ef51573e00e5e21307b39697": 47, "classif": [47, 55], "convnet": 47, "pil": 47, "amp": 47, "autocast": 47, "image_classif": 47, "torchvis": [47, 48], "resnet50": 47, "resnext101_32x4d": 47, "se_resnext101_32x4d": 47, "efficientnet_b0": 47, "efficientnet_b4": 47, "efficientnet_widese_b0": 47, "efficientnet_widese_b4": 47, "efficientnet_quant_b0": 47, "efficientnet_quant_b4": 47, "available_model": 47, "load_jpeg_from_fil": 47, "image_s": 47, "img_transform": 47, "compos": 47, "resiz": 47, "centercrop": 47, "totensor": 47, "img": 47, "no_grad": [47, 48], "wherea": 47, "view": [47, 55], "229": [47, 53], "mono": 47, "channel": 47, "sub_": 47, "div_": 47, "check_quant_weight_correct": 47, "checkpoint_path": 47, "map_loc": 47, "startswith": 47, "quantizers_sd_kei": 47, "_amax": 47, "named_modul": 47, "quantiz": [47, 55], "sd_all_kei": 47, "imgnet_class": 47, "loc_synset_map": 47, "model_arg": 47, "pretrained_from_fil": 47, "nvidia_resnet50_200821": 47, "pth": 47, "resnet50_pyt_amp": 47, "hub": 47, "conv1": 47, "conv2d": 47, "kernel_s": 47, "bn1": 47, "batchnorm2d": 47, "momentum": [47, 55], "affin": 47, "track_running_stat": 47, "maxpool": 47, "maxpool2d": 47, "dilat": 47, "ceil_mod": 47, "conv2": 47, "bn2": 47, "conv3": 47, "bn3": 47, "downsampl": 47, "layer2": 47, "layer4": 47, "avgpool": 47, "adaptiveavgpool2d": 47, "output_s": 47, "61951": 47, "0055323": 47, "0274711": 47, "0055320": 47, "0054197": 47, "1791658": 47, "1288589": 47, "0365653": 47, "2324928": 47, "6000478": 47, "num_bathc": 47, "array_split": 47, "strip": 47, "feature_extractor": 47, "feature_dict": [47, 49], "unabl": 47, "0168199": 47, "0118926": 47, "0415856": 47, "0494260": 47, "0810772": 47, "02it": 47, "0049314": 47, "23it": 47, "0066831": 47, "29it": 47, "0888693": 47, "11it": 47, "0067431": 47, "21it": 47, "6522546": 47, "0057811": 47, "5176252": 47, "0112373": 47, "47it": 47, "4636254": 47, "41it": 47, "0365658": 47, "20it": 47, "2124046": 47, "0104469": 47, "14it": 47, "0102493": 47, "17it": 47, "0051792": 47, "65it": 47, "0110017": 47, "0139630": 47, "83it": 47, "0143348": 47, "92it": 47, "0037618": 47, "0040002": 47, "70it": 47, "0317950": 47, "52it": 47, "0850669": 47, "0325258": 47, "6569888": 47, "0037736": 47, "0109303": 47, "44it": 47, "0103882": 47, "59it": 47, "0267287": 47, "24it": 47, "0100033": 47, "43it": 47, "1601215": 47, "46it": [47, 51], "0092028": 47, "0075963": 47, "3267334": 47, "69it": 47, "0059398": 47, "78it": 47, "0122565": 47, "82it": 47, "0052572": 47, "102": [47, 53], "38it": 47, "6404896": 47, "28it": 47, "0027428": 47, "0033883": 47, "0113270": 47, "0022286": 47, "25it": 47, "0068953": 47, "13it": 47, "0042949": 47, "0130297": 47, "15it": 47, "0028207": 47, "0054244": 47, "10it": 47, "1275680": 47, "0036533": 47, "0037297": 47, "51it": 47, "0962736": 47, "0042548": 47, "34it": 47, "0038109": 47, "0104009": 47, "22it": 47, "0180316": 47, "26it": 47, "0071925": 47, "139": 47, "31it": 47, "0087001": 47, "0056910": 47, "0064563": 47, "1720040": 47, "149": 47, "0041112": 47, "16it": 47, "4412528": 47, "0051362": 47, "158": 47, "0029992": 47, "0384309": 47, "0028367": 47, "50it": 47, "0038336": 47, "32it": 47, "0058725": 47, "164": 47, "0113328": 47, "166": 47, "3878542": 47, "33it": 47, "0026465": 47, "0040588": 47, "0086984": 47, "178": 47, "40it": 47, "0309047": 47, "181": 47, "0031405": 47, "185": 47, "0097493": 47, "186": 47, "09it": 47, "0346336": 47, "0078841": 47, "0018795": 47, "9151704": 47, "1417097": 47, "0054223": 47, "0117477": 47, "199": 47, "64it": 47, "0000041": 47, "30it": 47, "0028907": 47, "0366179": 47, "0109761": 47, "217": 47, "39it": 47, "7167686": 47, "219": 47, "0048973": 47, "226": 47, "0100112": 47, "3606394": 47, "0021890": 47, "228": 47, "0033874": 47, "0035019": 47, "232": 47, "1228953": 47, "237": 47, "7688990": 47, "0052954": 47, "0092159": 47, "0094349": 47, "0065136": 47, "246": 47, "0027805": 47, "0034904": 47, "248": [47, 53], "18it": 47, "0037522": 47, "06it": 47, "0036301": 47, "254": [47, 53, 55], "0037324": 47, "35it": 47, "0053622": 47, "265": 47, "42it": 47, "7278178": 47, "266": 47, "37it": 47, "0418239": 47, "0040489": 47, "0069280": 47, "08it": 47, "0049143": 47, "0064840": 47, "285": [47, 50], "0070723": 47, "19it": 47, "0057997": 47, "0056072": 47, "7446332": 47, "0076618": 47, "04it": 47, "0290014": 47, "0347330": 47, "303": 47, "36it": 47, "0159620": 47, "304": 47, "0044667": 47, "07it": 47, "0040190": 47, "3088364": 47, "0230367": 47, "0037147": 47, "310": 47, "0033282": 47, "4028134": 47, "312": 47, "1352824": 47, "314": 47, "0079400": 47, "318": 47, "0449869": 47, "0047526": 47, "320": 47, "0095593": 47, "321": [47, 55], "2762334": 47, "322": 47, "0023293": 47, "0024593": 47, "327": 47, "1116182": 47, "328": [47, 53], "0063462": 47, "0119577": 47, "0106727": 47, "0053884": 47, "337": 47, "0037077": 47, "03it": 47, "0040064": 47, "0089108": 47, "0023129": 47, "347": 47, "0044827": 47, "12it": 47, "0067108": 47, "359": 47, "0432432": 47, "0202415": 47, "0074812": 47, "0059311": 47, "0065073": 47, "0052820": 47, "0120865": 47, "0064620": 47, "0068505": 47, "2934916": 47, "0040137": 47, "0071864": 47, "0072973": 47, "387": 47, "0449951": 47, "388": 47, "27it": 47, "0074605": 47, "0328955": 47, "0077294": 47, "393": [47, 53], "0987918": 47, "394": 47, "0067520": 47, "395": 47, "0220016": 47, "0067236": 47, "0085838": 47, "0047561": 47, "0066075": 47, "0123374": 47, "0026143": 47, "0064626": 47, "0822388": 47, "0101664": 47, "0403579": 47, "0070112": 47, "2323633": 47, "0203408": 47, "1167638": 47, "71it": 47, "0144178": 47, "48it": 47, "0295432": 47, "435": 47, "0123865": 47, "436": 47, "55it": 47, "0110530": 47, "0082817": 47, "45it": 47, "0067525": 47, "0046333": 47, "439": 47, "0248953": 47, "0000033": 47, "0069165": 47, "0000014": 47, "0000027": 47, "05it": 47, "0063531": 47, "0041431": 47, "0831387": 47, "3908598": 47, "0056341": 47, "3833520": 47, "472": 47, "0058660": 47, "0086847": 47, "0074455": 47, "477": 47, "0037990": 47, "481": 47, "1764600": 47, "0372764": 47, "0368576": 47, "0368574": 47, "0366178": 47, "484": 47, "0067118": 47, "488": 47, "0044954": 47, "496": 47, "0078950": 47, "498": 47, "0050957": 47, "0058374": 47, "499": 47, "0027963": 47, "507": 47, "0362590": 47, "508": 47, "0008309": 47, "509": 47, "0065240": 47, "0055022": 47, "0418753": 47, "0070768": 47, "1706680": 47, "518": 47, "3836530": 47, "0050545": 47, "61it": 47, "8752440": 47, "523": 47, "81it": [47, 48], "0019504": 47, "0060117": 47, "526": 47, "1172060": 47, "3280916": 47, "0039502": 47, "3800796": 47, "0074238": 47, "0062032": 47, "0053891": 47, "0184115": 47, "0060968": 47, "0075165": 47, "549": 47, "0076998": 47, "0060176": 47, "0092745": 47, "0079936": 47, "0060747": 47, "2523756": 47, "554": [47, 50], "0092217": 47, "0046906": 47, "0206226": 47, "0086484": 47, "0175471": 47, "0085913": 47, "0233687": 47, "0053214": 47, "0032794": 47, "0040765": 47, "0064541": 47, "0365109": 47, "569": 47, "0337721": 47, "0032234": 47, "0344604": 47, "574": 47, "0041349": 47, "53it": 47, "0180073": 47, "6926486": 47, "583": 47, "0079596": 47, "586": 47, "0140603": 47, "0069745": 47, "0066154": 47, "1745787": 47, "0045995": 47, "0038675": 47, "0068971": 47, "596": 47, "0050205": 47, "598": 47, "0085175": 47, "0424237": 47, "603": [47, 53], "0190524": 47, "3365778": 47, "8119752": 47, "0031742": 47, "610": 47, "0100465": 47, "614": 47, "0072097": 47, "0071771": 47, "0174997": 47, "0033676": 47, "623": [47, 53], "0443567": 47, "0047559": 47, "627": 47, "0260295": 47, "0200768": 47, "640": 47, "0245238": 47, "0075679": 47, "0042418": 47, "645": 47, "0036814": 47, "0079756": 47, "0983922": 47, "0058642": 47, "659": 47, "0116016": 47, "663": 47, "0092238": 47, "666": 47, "2226519": 47, "0414982": 47, "0419641": 47, "0040246": 47, "0217168": 47, "674": 47, "0038452": 47, "675": 47, "3155242": 47, "0038255": 47, "0043153": 47, "0072209": 47, "686": 47, "0074797": 47, "688": 47, "2720826": 47, "690": 47, "0068227": 47, "0372765": 47, "0083713": 47, "0252133": 47, "0329913": 47, "703": 47, "0036840": 47, "56it": 47, "0067956": 47, "2195566": 47, "708": 47, "0080549": 47, "714": [47, 53], "0073398": 47, "716": 47, "0038205": 47, "718": 47, "0117220": 47, "719": 47, "0046198": 47, "0060351": 47, "0081568": 47, "0046921": 47, "0034739": 47, "0023251": 47, "0491764": 47, "0090642": 47, "741": [47, 53], "0037928": 47, "743": 47, "0457430": 47, "0057283": 47, "0462519": 47, "0110546": 47, "0045197": 47, "0062523": 47, "750": 47, "0112454": 47, "0065243": 47, "0396171": 47, "0059710": 47, "0080928": 47, "0126004": 47, "1833116": 47, "770": 47, "0075766": 47, "0123860": 47, "0123970": 47, "0323120": 47, "0035301": 47, "1216520": 47, "0028331": 47, "1330015": 47, "0062443": 47, "0485241": 47, "0154467": 47, "776": 47, "5235348": 47, "0191074": 47, "0060168": 47, "779": 47, "0081738": 47, "0379473": 47, "0063381": 47, "4427076": 47, "0173714": 47, "3794028": 47, "0464106": 47, "0090570": 47, "0087829": 47, "0041866": 47, "0444682": 47, "0058110": 47, "0072392": 47, "0080546": 47, "0064482": 47, "809": 47, "0044599": 47, "0439771": 47, "58it": 47, "0021756": 47, "820": 47, "0039676": 47, "0160801": 47, "0032981": 47, "0049854": 47, "2605312": 47, "0367257": 47, "829": 47, "6817944": 47, "0082081": 47, "1146283": 47, "0796335": 47, "0183355": 47, "0218094": 47, "0290820": 47, "845": 47, "1059793": 47, "0025665": 47, "848": 47, "0259786": 47, "854": 47, "0044369": 47, "0031127": 47, "857": 47, "0283644": 47, "0316599": 47, "0118767": 47, "0059758": 47, "0122194": 47, "0070404": 47, "0028484": 47, "0166792": 47, "0369903": 47, "0073115": 47, "0284655": 47, "9236264": 47, "892": 47, "0137094": 47, "893": 47, "0064323": 47, "895": 47, "49it": 47, "0062741": 47, "68it": 47, "0084237": 47, "901": 47, "0084273": 47, "4193400": 47, "906": 47, "0124307": 47, "908": 47, "0157383": 47, "0412808": 47, "0161860": 47, "918": 47, "4613254": 47, "2788556": 47, "925": 47, "1437361": 47, "3037582": 47, "0048211": 47, "4516162": 47, "0033932": 47, "0042871": 47, "57it": 47, "0137799": 47, "62it": 47, "1714196": 47, "0025117": 47, "2357144": 47, "1525898": 47, "0098088": 47, "6537238": 47, "0303151": 47, "951": 47, "0315632": 47, "0316352": 47, "0166557": 47, "956": 47, "0066879": 47, "3736766": 47, "0140340": 47, "959": [47, 53], "1570970": 47, "0075364": 47, "0099901": 47, "447": 47, "movies_poster_featur": [47, 49], "61504": 47, "huggingfac": 48, "jupyterlab": 48, "nbclassic": 48, "admin": 48, "pip3": 48, "cu111": 48, "torchaudio": 48, "whl": 48, "torch_stabl": 48, "barttoken": 48, "bartmodel": 48, "facebook": 48, "decod": 48, "return_tensor": 48, "pt": 48, "truncat": 48, "max_length": 48, "output_hidden_st": 48, "last_hidden_st": 48, "62423": [48, 49, 51], "average_embed": 48, "movies_synopsis_embed": [48, 49], "proceed": 49, "poster_featur": 49, "61947": 49, "text_featur": 49, "61291": 49, "tmdbid": 49, "0113497": 49, "8844": 49, "0113228": 49, "15602": 49, "0114885": 49, "31357": 49, "0113041": 49, "11862": 49, "0105812": 49, "feature_arrai": 49, "iterrow": [49, 51], "2049": 49, "poster_feature_": 49, "text_feature_": 49, "3073": [49, 51], "feature_df": [49, 51], "datafram": [49, 50], "poster_feature_0": [49, 51], "poster_feature_1": [49, 51], "poster_feature_2": [49, 51], "poster_feature_3": [49, 51], "poster_feature_4": [49, 51], "poster_feature_5": [49, 51], "poster_feature_6": [49, 51], "poster_feature_7": [49, 51], "poster_feature_8": [49, 51], "text_feature_1014": [49, 51], "text_feature_1015": [49, 51], "text_feature_1016": [49, 51], "text_feature_1017": [49, 51], "text_feature_1018": [49, 51], "text_feature_1019": [49, 51], "text_feature_1020": [49, 51], "text_feature_1021": [49, 51], "text_feature_1022": [49, 51], "text_feature_1023": [49, 51], "088281": 49, "036760": 49, "006470": 49, "023553": 49, "000163": 49, "238797": 49, "291230": 49, "197272": 49, "024294": 49, "307049": 49, "789571": 49, "084938": 49, "187339": 49, "061683": 49, "183281": 49, "356245": 49, "289105": 49, "134672": 49, "691380": 49, "045417": 49, "051422": 49, "203168": 49, "617449": 49, "443821": 49, "501953": 49, "736949": 49, "180542": 49, "313696": 49, "274087": 49, "153105": 49, "218745": 49, "187553": 49, "904370": 49, "069441": 49, "026665": 49, "817211": 49, "125072": 49, "173140": 49, "209240": 49, "451933": 49, "491917": 49, "743956": 49, "069061": 49, "900011": 49, "583347": 49, "192817": 49, "224088": 49, "182279": 49, "014646": 49, "004135": 49, "197796": 49, "077938": 49, "215127": 49, "021160": 49, "023108": 49, "394012": 49, "679462": 49, "225475": 49, "196255": 49, "169627": 49, "008575": 49, "172138": 49, "114755": 49, "127861": 49, "003679": 49, "082123": 49, "447287": 49, "002375": 49, "135956": 49, "989514": 49, "808180": 49, "317510": 49, "176658": 49, "078992": 49, "726118": 49, "017430": 49, "249834": 49, "183357": 49, "071451": 49, "644567": 49, "090399": 49, "147284": 49, "pyarrow": 49, "pypi": [49, 55], "satisfi": 49, "33mwarn": 49, "upgrad": [49, 50, 55], "026260": [49, 51], "857608": [49, 51], "410247": [49, 51], "066654": [49, 51], "382803": [49, 51], "899998": [49, 51], "511562": [49, 51], "592291": [49, 51], "565434": [49, 51], "636716": [49, 51], "578369": [49, 51], "996169": [49, 51], "402107": [49, 51], "412318": [49, 51], "859952": [49, 51], "293852": [49, 51], "341114": [49, 51], "727113": [49, 51], "085829": [49, 51], "141265": [49, 51], "721758": [49, 51], "679958": [49, 51], "955634": [49, 51], "391091": [49, 51], "324611": [49, 51], "505211": [49, 51], "258331": [49, 51], "048264": [49, 51], "161505": [49, 51], "431864": [49, 51], "836532": [49, 51], "525013": [49, 51], "654566": [49, 51], "823841": [49, 51], "818313": [49, 51], "856280": [49, 51], "638048": [49, 51], "685537": [49, 51], "119418": [49, 51], "911146": [49, 51], "470762": [49, 51], "762258": [49, 51], "626335": [49, 51], "768947": [49, 51], "241833": [49, 51], "775992": [49, 51], "236340": [49, 51], "865548": [49, 51], "387806": [49, 51], "668321": [49, 51], "552122": [49, 51], "750238": [49, 51], "863707": [49, 51], "382173": [49, 51], "894487": [49, 51], "565142": [49, 51], "164083": [49, 51], "538184": [49, 51], "980678": [49, 51], "643513": [49, 51], "928519": [49, 51], "794906": [49, 51], "201022": [49, 51], "744666": [49, 51], "962188": [49, 51], "915320": [49, 51], "777534": [49, 51], "904200": [49, 51], "167337": [49, 51], "875194": [49, 51], "180481": [49, 51], "815904": [49, 51], "808288": [49, 51], "036711": [49, 51], "902779": [49, 51], "580946": [49, 51], "772951": [49, 51], "239788": [49, 51], "061874": [49, 51], "162997": [49, 51], "388310": [49, 51], "236311": [49, 51], "162757": [49, 51], "207134": [49, 51], "111078": [49, 51], "250022": [49, 51], "335043": [49, 51], "091674": [49, 51], "121507": [49, 51], "418124": [49, 51], "150020": [49, 51], "803506": [49, 51], "059504": [49, 51], "002342": [49, 51], "932321": [49, 51], "manipul": 50, "terabyt": [50, 55], "rapid": 50, "apt": 50, "graphviz": 50, "ubuntu": 50, "focal": 50, "inreleas": 50, "ppa": 50, "launchpad": 50, "deadsnak": 50, "backport": 50, "33m": 50, "newest": [50, 55], "3build2": 50, "libarchive13": 50, "librhash0": 50, "libuv1": 50, "autoremov": 50, "newli": [50, 55], "columngroup": 50, "column_nam": 50, "op1": 50, "op2": 50, "sound": 50, "joinextern": 50, "left": 50, "acycl": 50, "dag": 50, "visual": 50, "contigu": 50, "fulfil": 50, "v0": [50, 54], "movieid_dup": 50, "_duplic": 50, "lambdaop": 50, "int8": 50, "manifest": 50, "matter": 50, "solv": 50, "break": 50, "demand": [50, 55], "hood": 50, "decomposit": 50, "lazili": 50, "couldn": 50, "train_dataset": 50, "100mb": 50, "valid_dataset": 50, "640002432": 50, "troubleshoot": 50, "160000608": 50, "scikit": [50, 55], "981": 50, "0x7fbb086a3370": 50, "\u00b5": 50, "restor": [50, 55], "162542": [50, 51], "56586": [50, 51], "movieid_dupl": [50, 51], "part_0": 50, "26460": 50, "97438": 50, "1704": 50, "105574": 50, "3568": 50, "39464": 50, "127724": 50, "movie_map": 51, "movieid_s": 51, "56581": 51, "209155": 51, "56582": 51, "209157": 51, "56583": 51, "209159": 51, "56584": 51, "209169": 51, "56585": 51, "209171": 51, "set_index": 51, "num_token": 51, "embedding_matrix": 51, "3967": 51, "3072": 51, "17294852": 51, "15285189": 51, "26095702": 51, "75369112": 51, "29602144": 51, "78917433": 51, "13539355": 51, "84843078": 51, "70951219": 51, "10441725": 51, "72871966": 51, "11719463": 51, "18514273": 51, "72422918": 51, "04273015": 51, "1404219": 51, "54169348": 51, "96875489": 51, "08307642": 51, "3673532": 51, "15777258": 51, "01297393": 51, "36267638": 51, "14848055": 51, "82188376": 51, "56516905": 51, "70838085": 51, "45119769": 51, "9273439": 51, "42464321": 51, "henc": [51, 55], "shall": 51, "plu": 51, "pretrained_embedding_s": 51, "convert_pretrained_embeddings_to_sparse_model": 51, "pre_trained_sparse_embed": 51, "hugectr_pretrained_embed": 51, "afterward": [51, 55], "noqa": 51, "pretrained_embed": 51, "10001": 51, "476440390": 51, "275735": 51, "16384000": 51, "256000": 51, "1072": 51, "297110": 51, "581705": 51, "274680": 51, "574425": 51, "746443": 51, "054157": 51, "332273": 51, "564224": 51, "277900": 51, "550730": 51, "764630": 51, "054009": 51, "434429": 51, "536507": 51, "279014": 51, "525059": 51, "773702": 51, "054287": 51, "335757": 51, "532503": 51, "278661": 51, "526352": 51, "779897": 51, "167787": 51, "447136": 51, "547141": 51, "376035": 51, "548916": 51, "784775": 51, "054224": 51, "334735": 51, "540766": 51, "277728": 51, "515882": 51, "786808": 51, "054551": 51, "1300": 51, "336372": 51, "531510": 51, "1400": [51, 53], "277408": 51, "511901": 51, "791416": 51, "165986": 51, "1500": 51, "554217": 51, "522047": 51, "279548": 51, "540521": 51, "793460": 51, "054801": 51, "1700": 51, "336303": 51, "525447": 51, "1800": [51, 53], "278906": 51, "523558": 51, "793137": 51, "054431": 51, "1900": 51, "336023": 51, "511348": 51, "384979": 51, "515268": 51, "796599": 51, "172160": 51, "2100": 51, "453174": 51, "526615": 51, "2200": 51, "278781": 51, "536789": 51, "798459": 51, "054509": 51, "2300": 51, "335596": 51, "508902": 51, "2400": 51, "277901": 51, "520411": 51, "798726": 51, "054518": 51, "2500": 51, "444557": 51, "490832": 51, "2600": 51, "279310": 51, "507799": 51, "801325": 51, "164203": 51, "2700": 51, "443310": 51, "519460": 51, "277569": 51, "512426": 51, "800731": 51, "054590": 51, "2900": 51, "336213": 51, "512216": 51, "384833": 51, "522102": 51, "803801": 51, "054133": 51, "3100": 51, "334245": 51, "507463": 51, "279046": 51, "526148": 51, "802950": 51, "070003": 51, "3300": 51, "352114": 51, "504611": 51, "3400": 51, "277292": 51, "502907": 51, "804364": 51, "054315": 51, "3500": 51, "442956": 51, "512927": 51, "3600": 51, "277974": 51, "519042": 51, "806404": 51, "054291": 51, "3700": 51, "335365": 51, "499368": 51, "3800": 51, "277786": 51, "509683": 51, "805164": 51, "064908": 51, "3900": 51, "344106": 51, "508182": 51, "387872": 51, "493841": 51, "808367": 51, "054222": 51, "4100": 51, "335361": 51, "508106": 51, "278802": 51, "519000": 51, "808897": 51, "054320": 51, "4300": 51, "334094": 51, "502797": 51, "4400": 51, "388990": 51, "508890": 51, "809649": 51, "074584": 51, "355005": 51, "505778": 51, "4600": 51, "277275": 51, "532776": 51, "810962": 51, "054498": 51, "4700": 51, "335553": 51, "503001": 51, "4800": 51, "279237": 51, "495762": 51, "808618": 51, "4900": 51, "449926": 51, "503213": 51, "277141": 51, "481138": 51, "810767": 51, "064807": 51, "untrain": 51, "5100": 51, "630313": 51, "485568": 51, "5200": 51, "278359": 51, "518924": 51, "811217": 51, "054624": 51, "5300": 51, "336246": 51, "516505": 51, "5400": 51, "384571": 51, "512404": 51, "811464": 51, "054350": 51, "5500": 51, "334675": 51, "500305": 51, "5600": 51, "279563": 51, "484969": 51, "bart": 52, "din": [53, 55], "0bcb014209e219273cb6fd4152df7df713cbac61": 53, "25t09": 53, "53z": 53, "protoc": 53, "4b40fff8bb27201ba07b6fa5651217fb": 53, "jar": 53, "172": 53, "dlrm_parquet": 53, "supergroup": 53, "112247365": 53, "112243637": 53, "112251207": 53, "112241764": 53, "112247838": 53, "112244076": 53, "112253553": 53, "112249557": 53, "112239093": 53, "112249156": 53, "lastli": [53, 55], "label0": 53, "c5": 53, "c6": 53, "c7": 53, "c8": 53, "c9": 53, "c10": 53, "c12": 53, "c13": 53, "c14": 53, "c15": 53, "c16": 53, "c17": 53, "c18": 53, "c19": 53, "c20": 53, "c21": 53, "c22": 53, "c23": 53, "c24": 53, "c25": 53, "c26": 53, "c27": 53, "c28": 53, "c29": 53, "c30": 53, "c31": 53, "c32": 53, "c33": 53, "c34": 53, "c35": 53, "c36": 53, "c37": 53, "c38": 53, "c39": 53, "train_with_hdf": 53, "datasourcetype_t": 53, "405274": 53, "72550": 53, "55008": 53, "222734": 53, "316071": 53, "156265": 53, "220243": 53, "200179": 53, "234566": 53, "335625": 53, "278726": 53, "263070": 53, "312542": 53, "203773": 53, "145859": 53, "117421": 53, "78140": 53, "3648": 53, "156308": 53, "94562": 53, "357703": 53, "386976": 53, "238046": 53, "230917": 53, "156382": 53, "10720": 53, "502": 53, "3218787045": 53, "607": 53, "529": 53, "530": 53, "a10": 53, "21954560": 53, "010000": 53, "716815": 53, "69327": 53, "856": 53, "719486": 53, "693207": 53, "750294": 53, "693568": 53, "721128": 53, "693352": 53, "78435": 53, "499891": 53, "5486": 53, "2728": 53, "693178": 53, "720984": 53, "693292": 53, "756448": 53, "693053": 53, "725832": 53, "693433": 53, "382": 53, "77763": 53, "693193": 53, "500092": 53, "57548": 53, "575": 53, "0_sparse_2000": 53, "_dense_2000": 53, "_opt_dense_2000": 53, "430": 53, "drwxr": 53, "xr": 53, "9479684": 53, "functionalit": 53, "dcn_parquet": 53, "train_with_s3": 53, "east": [53, 55], "39884": 53, "39043": 53, "17289": 53, "7420": 53, "20263": 53, "7120": 53, "1543": 53, "slice12": 53, "amazonaw": [53, 55], "pipeline_test": 53, "dcn_model": 53, "569406237": 53, "822": 53, "710": 53, "713": 53, "397821": 53, "2457600": 53, "1453": 53, "25574": 53, "712926": 53, "16987": 53, "701584": 53, "22653": 53, "696012": 53, "16121": 53, "698167": 53, "42367": 53, "695641": 53, "500979": 53, "0735": 53, "6575": 53, "696028": 53, "03696": 53, "693602": 53, "089": 53, "73903": 53, "693618": 53, "10101": 53, "696232": 53, "59704": 53, "50103": 53, "5882": 53, "473": 53, "0_sparse_1000": 53, "_dense_1000": 53, "_opt_dense_1000": 53, "843": 53, "988": 53, "denable_gc": 53, "enable_gc": 53, "gcp": 53, "credenti": 53, "environment": 53, "google_application_credenti": 53, "gcs_kei": 53, "train_with_gc": 53, "1008636636": 53, "308": 53, "323": 53, "236": 53, "22452": 53, "786299": 53, "6347": 53, "738846": 53, "22938": 53, "711017": 53, "63355": 53, "708317": 53, "850": 53, "11226": 53, "697101": 53, "501301": 53, "0298": 53, "6054": 53, "698077": 53, "744573": 53, "697804": 53, "244": 53, "04207": 53, "695543": 53, "761465": 53, "695323": 53, "28151": 53, "695319": 53, "647": 53, "501347": 53, "3576": 53, "664": 53, "804": 53, "submiss": 54, "ve": [54, 55], "billion": 54, "curv": 54, "dual": 54, "dgx1": 54, "emb_dim": 54, "6x": 54, "criteolab": 54, "criteo_script": [54, 55], "criteo2hugectr": 54, "tfrecord": 54, "chart": 54, "seven": 54, "exhibit": 54, "incremental_dump": 55, "illeg": 55, "hierarh": 55, "inconsist": 55, "anymor": 55, "export_predict": 55, "legaci": 55, "corner": 55, "nan": 55, "occasion": 55, "thousand": 55, "happen": 55, "cub": 55, "workaround": 55, "rmm": 55, "mr": 55, "set_current_device_resourc": 55, "356": 55, "hctr_rmm_settabl": 55, "cautiou": 55, "1g": 55, "243": 55, "kafkaproduc": 55, "succe": 55, "unrespons": 55, "reachabl": 55, "joint": 55, "suit": 55, "omit": 55, "futr": 55, "hierarchicalkv": 55, "cmakelist": 55, "minor": 55, "duse_cudart_stat": 55, "torchscript": 55, "coupl": 55, "regress": 55, "unnessari": 55, "h800": 55, "fp8": 55, "dequant": 55, "x86": 55, "superchip": 55, "hand": 55, "_concat_": 55, "dense_embed": 55, "refin": 55, "devicesegmentedsort": 55, "devicesegmentedradixsort": 55, "led": 55, "datadistributor": 55, "fly": 55, "member": 55, "elimin": 55, "parquet_reader_opt": 55, "set_num_row": 55, "pr": 55, "core23": 55, "hctr_print": 55, "did": 55, "cmak": 55, "ing": 55, "clarifi": 55, "refactor": 55, "dynamic_vari": 55, "adamax": 55, "adadelta": 55, "fault": 55, "wrong": 55, "fusion": 55, "cudadevicesynchron": 55, "embeddingtablecollect": 55, "utest": 55, "unfus": 55, "analayz": 55, "stress": 55, "crosslay": 55, "backpropag": 55, "move": 55, "denselayerswitch": 55, "unfamiliar": 55, "nic": 55, "python_interfac": 55, "strengthen": 55, "datasest": 55, "is_exclusive_kei": 55, "nob": 55, "sparseparam": 55, "misus": 55, "clearer": 55, "violat": 55, "newer": 55, "wdl_predict": 55, "januari": 55, "calendar": 55, "v23": 55, "bst": 55, "conceptu": 55, "arxiv": 55, "ab": 55, "2008": 55, "13535": 55, "redisclusterbackend": 55, "prop": 55, "test_embedding_table_optim": 55, "embedding_collect": 55, "clariti": 55, "bind": 55, "recov": 55, "sometim": 55, "problem": 55, "failur": 55, "macro": 55, "reiniti": 55, "end_offset": 55, "deeprec": 55, "embeddingplann": 55, "embedding_collection_test": 55, "db_type": 55, "boundari": 55, "hierarchc": 55, "co": 55, "round": 55, "trip": 55, "mlplayer": 55, "dgx_a100_mlp": 55, "preprocess_censu": 55, "mmoe": 55, "replicacontext": 55, "4_nvt_process": 55, "dgx_a100_ib_nvlink": 55, "dlpack": 55, "odd": 55, "sector": 55, "unreport": 55, "leak": 55, "table_group_strategi": 55, "table_placement_strategi": 55, "mmoe_parquet": 55, "simplif": 55, "mybucket": 55, "graphic": 55, "epilogu": 55, "corrupt": 55, "improp": 55, "io_block_s": 55, "max_nr_request": 55, "stabliz": 55, "globalembeddingdata": 55, "localembeddingdata": 55, "mention": 55, "bullet": 55, "ratio": 55, "subset": 55, "durat": 55, "hadoopfilesystem": 55, "hadoop_filesystem": 55, "hpp": 55, "third_parti": 55, "finer": 55, "deperac": 55, "overlapped_pipelin": 55, "triton_tf_deploi": 55, "cucollect": 55, "embedding_storag": 55, "dynamic_embedding_storag": 55, "interoper": 55, "slurm": 55, "305": 55, "482141": 55, "440781": 55, "46146124601364136": 55, "databasebackend": 55, "budget": 55, "nanosecond": 55, "strict": 55, "caller": 55, "unprocess": 55, "callback": 55, "load_dump": 55, "sst": 55, "find_tabl": 55, "discov": 55, "routin": 55, "inlin": 55, "340": 55, "concept": 55, "matrixmultipli": 55, "goal": 55, "navig": 55, "multiplex": 55, "gbp": 55, "upsert": 55, "diminish": 55, "recal": 55, "4x": 55, "rather": 55, "safer": 55, "ndcg": 55, "smape": 55, "extractor": 55, "261": 55, "inspir": 55, "roc_auc_scor": 55, "unweight": 55, "release_not": 55, "reorgan": 55, "dlrm_kaggle_fp32": 55, "36672493": 55, "301": 55, "standalon": 55, "prodvid": 55, "decoupl": 55, "realli": 55, "embedding_workspace_calcul": 55, "qa": 55, "codebas": 55, "relev": 55, "model_analyz": 55, "won": 55, "bare": 55, "notic": 55, "lessen": 55, "dlrm_benchmark": 55, "uint32_t": 55, "int64_t": 55, "uint32": 55, "all2alldenseembed": 55, "embedding_initi": 55, "randomuniform": 55, "readabl": 55, "robust": 55, "resolut": 55, "recycl": 55, "unload": 55, "invok": 55, "conda": 55, "event": 55, "notebok": 55, "inaccur": 55, "parameter": 55, "meaning": 55, "jabber": 55, "uniformli": 55, "interleav": 55, "shouldn": 55, "graphschedul": 55, "grapschedul": 55, "cudagraph": 55, "gap": 55, "adjac": 55, "grain": 55, "frozen": 55, "unfrozen": 55, "worri": 55, "gpu_cach": 55, "oversubscript": 55, "hmem": 55, "mo": 55, "use_host_memory_p": 55, "ps_type": 55, "vice": 55, "versa": 55, "famili": 55, "poc": 55, "assist": 55, "explain": 55, "involv": 55, "netwoek": 55, "fusedrelubiasfullyconnectedlay": 55, "holist": 55, "use_overlapped_pipelin": 55, "use_hash_t": 55, "multiworkermirroredstrategi": 55, "concret": 55, "ncf": 55, "gmf": 55, "neumf": 55, "dien": 55, "paraquet": 55, "moment": 55, "stand": 55, "alon": 55, "dotproduct": 55, "__half2": 55, "vocabulary_s": 55, "streamlin": 55, "grasp": 55, "embedding_plugin": 55, "localizedslotsparseembeddinghashonehot": 55, "claus": 55, "max_eval_sampl": 55, "multiplylay": 55, "weightmultiplylay": 55, "perl": 55, "embeddinglay": 55, "helper": 55, "coars": 55, "tensorfloat": 55, "mantissa": 55, "expon": 55, "redesign": 55, "multinod": 55, "hugectr_user_guid": 55, "preprocess_nvt": 55, "hasn": 55, "dl": 56, "vast": 56, "broad": 56, "balanc": 56, "littl": 56}, "objects": {"hierarchical_parameter_server": [[8, 0, 1, "", "Init"], [9, 1, 1, "", "LookupLayer"], [9, 1, 1, "", "SparseLookupLayer"]], "hierarchical_parameter_server.LookupLayer": [[9, 2, 1, "", "call"]], "hierarchical_parameter_server.SparseLookupLayer": [[9, 2, 1, "", "call"]]}, "objtypes": {"0": "py:function", "1": "py:class", "2": "py:method"}, "objnames": {"0": ["py", "function", "Python function"], "1": ["py", "class", "Python class"], "2": ["py", "method", "Python method"]}, "titleterms": {"question": 0, "answer": 0, "1": [0, 30, 41, 43, 54, 55], "who": 0, "ar": 0, "target": 0, "user": 0, "hugectr": [0, 2, 3, 4, 25, 29, 31, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 51, 53, 54], "2": [0, 30, 41, 43, 54, 55], "which": 0, "model": [0, 4, 5, 6, 20, 21, 22, 26, 27, 30, 31, 32, 33, 36, 40, 42, 48, 51, 53], "can": 0, "support": [0, 36], "3": [0, 30, 41, 43, 55], "doe": 0, "tensorflow": [0, 10, 24, 30, 33, 54], "4": [0, 30, 41, 43, 55], "multipl": [0, 21, 33], "node": [0, 36], "ctr": 0, "train": [0, 4, 5, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33, 35, 36, 40, 41, 42, 44, 45, 51, 53], "5": [0, 30, 41, 55], "how": [0, 35], "deal": 0, "huge": 0, "embed": [0, 2, 5, 19, 22, 26, 27, 30, 40, 41, 48, 51], "tabl": [0, 19, 21, 23, 28, 30, 40], "cannot": 0, "store": [0, 49], "singl": 0, "gpu": [0, 33, 47], "memori": 0, "6": [0, 55], "7": [0, 55], "must": 0, "we": 0, "us": [0, 2, 10, 13, 17, 19, 24, 30, 31, 32, 33, 38, 40, 42], "dgx": [0, 54], "famili": 0, "a100": [0, 54], "run": [0, 30, 40, 43, 50], "8": [0, 55], "without": [0, 41], "infiniband": 0, "9": [0, 55], "i": 0, "ani": 0, "requir": 0, "cpu": 0, "configur": [0, 5, 20, 21, 22, 24, 26, 27, 30, 31, 32, 33], "execut": [0, 5], "10": 0, "what": [0, 55], "specif": [0, 25, 29, 34, 43], "format": [0, 4, 30], "file": [0, 4, 30, 31, 32, 33, 53], "input": [0, 2, 21, 30], "11": [0, 55], "python": [0, 4], "interfac": [0, 4], "12": [0, 55], "do": [0, 30, 31, 32, 33], "synchron": 0, "otherwis": 0, "asynchron": 0, "13": 0, "stream": 0, "14": 0, "slot": 0, "15": 0, "differ": 0, "between": 0, "localizedslotembed": 0, "distributedslotembed": 0, "16": 0, "For": 0, "multi": [0, 36, 41, 44, 49, 52], "dataread": [0, 4], "read": 0, "same": 0, "batch": 0, "data": [0, 4, 28, 30, 31, 38, 40, 41, 42, 44, 46, 49, 53], "each": 0, "step": [0, 30, 45], "17": 0, "As": 0, "parallel": [0, 36], "layer": [0, 2, 4, 9, 20, 21, 22, 24, 26, 27, 33, 51], "get": [0, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 45], "all": [0, 46, 47, 48], "lookup": [0, 5, 28, 41], "featur": [0, 36, 47, 48, 49, 51], "from": [0, 20, 21, 22, 23, 24, 26, 27, 28, 30, 34, 35, 38, 41, 46, 47], "18": 0, "set": [0, 35], "claus": 0, "two": 0, "need": 0, "19": 0, "save": [0, 20, 21, 26], "load": [0, 22, 51], "20": 0, "could": 0, "post": 0, "import": 0, "other": 0, "framework": 0, "infer": [0, 4, 5, 20, 21, 23, 24, 26, 30, 35, 41], "deploy": [0, 41], "21": 0, "overlap": 0, "22": 0, "": [0, 48, 54, 55], "valu": 0, "23": [0, 55], "benchmark": [0, 6, 10, 17, 30, 38], "my": 0, "network": 0, "24": [0, 55], "workspace_size_per_gpu_in_mb": 0, "slot_size_arrai": 0, "25": 0, "nvlink": 0, "26": 0, "onli": 0, "server": [0, 5, 7, 10, 13, 17, 18, 20, 25, 29, 30, 36, 41], "27": 0, "28": 0, "pretrain": [0, 22, 47, 48, 51], "29": 0, "construct": 0, "graph": [0, 20, 21, 24, 26, 30, 31, 32, 33], "branch": 0, "topologi": 0, "30": 0, "good": 0, "practic": 0, "vector": [0, 41], "size": 0, "31": 0, "resolv": 0, "bu": 0, "error": 0, "when": 0, "sampl": 0, "notebook": [0, 10, 13, 17, 25, 29, 34, 40, 43, 52], "32": 0, "log": 0, "pool": 0, "empti": 0, "impli": 0, "addit": 1, "resourc": [1, 6, 39], "class": [2, 4, 12], "method": [2, 4], "spars": [2, 21, 32, 33, 35, 36, 56], "type": 2, "detail": 2, "distributedslotsparseembeddinghash": 2, "localizedslotsparseembeddinghash": 2, "localizedslotsparseembeddingonehot": 2, "dens": 2, "usag": 2, "fullyconnect": 2, "mlp": 2, "multicross": 2, "fmorder2": 2, "weightmultipli": 2, "elementwisemultipli": 2, "batchnorm": 2, "layernorm": 2, "concat": 2, "reshap": 2, "select": 2, "slice": 2, "dropout": 2, "elu": 2, "relu": 2, "sigmoid": 2, "interact": 2, "add": [2, 4], "reducesum": 2, "gru": 2, "preludic": 2, "scale": 2, "fusedreshapeconcat": 2, "fusedreshapeconcatgener": 2, "softmax": 2, "sub": 2, "reducemean": 2, "matrixmutipli": 2, "multiheadattent": 2, "sequencemask": 2, "gather": 2, "binarycrossentropyloss": 2, "crossentropyloss": 2, "multicrossentropyloss": 2, "collect": [2, 40, 46], "about": [2, 4, 38, 40], "overview": [2, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 35, 41, 42, 44, 53], "known": [2, 55], "limit": 2, "embeddingtableconfig": 2, "embeddingcollectionconfig": 2, "embedding_lookup": 2, "shard": 2, "api": [3, 4, 7, 11, 16, 40], "document": 3, "high": 4, "level": 4, "solver": 4, "createsolv": 4, "asyncparam": 4, "hybridembeddingparam": 4, "datareaderparam": 4, "dataset": [4, 38, 45], "list": [4, 25, 29, 34, 43], "raw": 4, "parquet": 4, "optparamspi": 4, "createoptim": 4, "compil": 4, "fit": 4, "summari": [4, 36], "graph_to_json": 4, "construct_from_json": 4, "load_dense_weight": 4, "load_dense_optimizer_st": 4, "load_sparse_weight": 4, "load_sparse_optimizer_st": 4, "freeze_dens": 4, "freeze_embed": 4, "unfreeze_dens": 4, "unfreeze_embed": 4, "reset_learning_rate_schedul": 4, "set_sourc": 4, "low": 4, "learningrateschedul": 4, "get_next": 4, "is_eof": 4, "get_learning_rate_schedul": 4, "get_data_reader_train": 4, "get_data_reader_ev": 4, "start_data_read": 4, "set_learning_r": 4, "get_current_loss": 4, "eval": 4, "get_eval_metr": 4, "save_params_to_fil": 4, "check_out_tensor": 4, "inferenceparam": 4, "inferencemodel": 4, "predict": 4, "evalu": [4, 54], "gener": [4, 28, 31, 38, 41], "datageneratorparam": 4, "datagener": 4, "sourc": [4, 5, 35], "datasourceparam": 4, "hierarch": [5, 7, 10, 13, 17, 18, 20, 25, 29, 36, 41], "paramet": [5, 7, 10, 13, 17, 18, 20, 25, 29, 36, 41], "databas": 5, "backend": [5, 24], "introduct": [5, 10, 13, 17, 38], "hp": [5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 26, 28, 30, 31, 32, 33, 34, 41], "background": 5, "architectur": 5, "iter": 5, "updat": 5, "optim": [5, 36], "cach": 5, "param": 5, "syntax": 5, "volatil": 5, "overflow": 5, "common": 5, "persist": 5, "dlrm": [6, 26, 27, 40, 53], "setup": [6, 40, 41, 42, 53], "result": [6, 19], "initi": 8, "sparselookuplay": [9, 21, 26], "lookuplay": [9, 12, 20, 21, 24], "plugin": [10, 11, 12, 13, 14, 15, 16, 17, 30, 31, 32, 33, 34], "benefit": 10, "workflow": [10, 17], "instal": [10, 13, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 38], "comput": [10, 13, 17, 38], "capabl": [10, 13, 17, 38], "ngc": [10, 13, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 43], "contain": [10, 13, 17, 30, 34, 35, 38], "exampl": [10, 13, 17, 42, 43, 52, 53], "torch": [11, 12, 13, 28], "creator": 15, "tensorrt": [16, 17, 30, 31, 32, 33, 34], "profil": 19, "build": [19, 27, 30, 31, 32, 33, 35, 38, 43], "creat": [19, 20, 21, 23, 24, 26, 30, 49], "synthet": [19, 38, 49], "measur": 19, "triton": [19, 24, 30, 31, 32, 33], "perf": 19, "analyz": 19, "v": 19, "demo": [20, 22, 23, 26, 27, 28, 31, 32, 33, 41], "nativ": [20, 21, 22, 24, 33], "tf": [20, 21, 22, 23, 24, 30, 33], "pre": [22, 50, 51], "via": 22, "fusion": [23, 28], "savedmodel": [23, 24], "make": 23, "deploi": [24, 31, 32, 33], "trt": 24, "quickstart": [25, 29, 34], "pull": [25, 29, 34, 43], "docker": [25, 29, 30, 43], "clone": [25, 29, 34, 43], "repositori": [25, 29, 30, 34, 43], "start": [25, 29, 34, 35, 43, 45], "jupyt": [25, 29, 34, 43], "system": [25, 29, 30, 34, 43, 44, 53], "sok": [26, 27, 35], "larg": 30, "integr": [30, 31, 32, 33], "engin": [30, 31, 32, 33], "step1": [30, 31, 32, 33], "prepar": [30, 31, 32, 33, 40, 42, 53], "147gb": 30, "scratch": [30, 38, 41], "step2": [30, 31, 32, 33], "json": [30, 31, 32, 33], "step3": [30, 31, 32, 33], "convert": [30, 31, 32, 33, 36, 41, 45], "onnx": [30, 31, 32, 33, 36, 41], "surgeri": [30, 31, 32, 33], "step4": 30, "launch": 30, "arm64": 30, "grace": 30, "hooper": 30, "nvidia": [30, 47], "merlin": [30, 35, 39], "imag": 30, "host": 30, "pytorch": 32, "contribut": 35, "new": [35, 55], "code": 35, "your": 35, "develop": 35, "up": 35, "environ": 35, "With": 35, "oper": [35, 36, 56], "kit": [35, 36, 56], "core": 36, "mix": 36, "precis": 36, "sgd": 36, "learn": 36, "rate": 36, "schedul": 36, "hdf": [36, 53], "talk": 37, "blog": 37, "tool": 38, "download": [38, 45, 47, 48], "preprocess": [38, 42, 50], "relat": 39, "thi": 40, "concept": 40, "refer": 40, "an": 40, "follow": 40, "command": 40, "termin": 40, "script": 40, "placement": 40, "strategi": 40, "round": 40, "robin": 40, "uniform": 40, "hybrid": 40, "dynam": 40, "hash": 40, "dlpack": 41, "process": [41, 50], "redi": 41, "cluster": 41, "tl": 41, "ssl": 41, "end": 42, "nvtabular": [42, 50], "wdl": 42, "custom": 43, "option": 43, "recommend": 44, "modal": [44, 49, 52], "movielen": [45, 46], "25m": 45, "split": 45, "valid": 45, "next": 45, "enrich": 46, "scrape": 46, "imdb": 46, "synopsi": [46, 48], "movi": [46, 47, 48, 49, 51], "poster": [46, 47], "extract": [47, 48], "resnet": 47, "50": 47, "cloud": [47, 53], "bart": 48, "text": 48, "summar": 48, "real": 49, "etl": 50, "defin": [50, 51], "our": 50, "pipelin": 50, "check": 50, "output": 50, "non": 51, "trainabl": 51, "remot": 53, "dcn": 53, "aw": 53, "s3": 53, "googl": 53, "storag": 53, "perform": 54, "mlperf": 54, "releas": 55, "note": 55, "version": 55, "06": 55, "08": 55, "04": 55, "02": 55, "0": 55, "issu": 55}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx.ext.intersphinx": 1, "sphinx": 57}, "alltitles": {"Questions and Answers": [[0, "questions-and-answers"]], "1. Who are the target users of HugeCTR?": [[0, "who-are-the-target-users-of-hugectr"]], "2. Which models can be supported in HugeCTR?": [[0, "which-models-can-be-supported-in-hugectr"]], "3. Does HugeCTR support TensorFlow?": [[0, "does-hugectr-support-tensorflow"]], "4. Does HugeCTR support multiple nodes CTR training?": [[0, "does-hugectr-support-multiple-nodes-ctr-training"]], "5. How to deal with the huge embedding table that cannot be stored in a single GPU memory?": [[0, "how-to-deal-with-the-huge-embedding-table-that-cannot-be-stored-in-a-single-gpu-memory"]], "6. Which GPUs are supported in HugeCTR?": [[0, "which-gpus-are-supported-in-hugectr"]], "7. Must we use the DGX family such as DGX A100 to run HugeCTR?": [[0, "must-we-use-the-dgx-family-such-as-dgx-a100-to-run-hugectr"]], "8. Can HugeCTR run without InfiniBand?": [[0, "can-hugectr-run-without-infiniband"]], "9. Is there any requirement of CPU configuration for HugeCTR execution?": [[0, "is-there-any-requirement-of-cpu-configuration-for-hugectr-execution"]], "10. What is the specific format of files as input in HugeCTR?": [[0, "what-is-the-specific-format-of-files-as-input-in-hugectr"]], "11.\t Does HugeCTR support Python interface?": [[0, "does-hugectr-support-python-interface"]], "12. Does HugeCTR do synchronous training with multiple GPUs (and nodes)? Otherwise, does it do asynchronous training?": [[0, "does-hugectr-do-synchronous-training-with-multiple-gpus-and-nodes-otherwise-does-it-do-asynchronous-training"]], "13. Does HugeCTR support stream training?": [[0, "does-hugectr-support-stream-training"]], "14. What is a \u201cslot\u201d in HugeCTR?": [[0, "what-is-a-slot-in-hugectr"]], "15. What are the differences between LocalizedSlotEmbedding and DistributedSlotEmbedding?": [[0, "what-are-the-differences-between-localizedslotembedding-and-distributedslotembedding"]], "16. For multi-node\uff0cis DataReader required to read the same batch of data on each node for each step?": [[0, "for-multi-node-is-datareader-required-to-read-the-same-batch-of-data-on-each-node-for-each-step"]], "17. As model parallelism in embedding layers, how does it get all the embedding lookup features from multi-node / multi-gpu?": [[0, "as-model-parallelism-in-embedding-layers-how-does-it-get-all-the-embedding-lookup-features-from-multi-node-multi-gpu"]], "18. How to set data clauses, if there are two embeddings needed?": [[0, "how-to-set-data-clauses-if-there-are-two-embeddings-needed"]], "19. How to save and load models in HugeCTR?": [[0, "how-to-save-and-load-models-in-hugectr"]], "20. Could the post training model from HugeCTR be imported into other frameworks such as TensorFlow for inference deployment?": [[0, "could-the-post-training-model-from-hugectr-be-imported-into-other-frameworks-such-as-tensorflow-for-inference-deployment"]], "21. Does HugeCTR support overlap between different slots?": [[0, "does-hugectr-support-overlap-between-different-slots"]], "22. What if there\u2019s no value in a slot?": [[0, "what-if-there-s-no-value-in-a-slot"]], "23. How can I benchmark my network?": [[0, "how-can-i-benchmark-my-network"]], "24. How to set workspace_size_per_gpu_in_mb and slot_size_array?": [[0, "how-to-set-workspace-size-per-gpu-in-mb-and-slot-size-array"]], "25. Is nvlink required in HugeCTR?": [[0, "is-nvlink-required-in-hugectr"]], "26. Is DGX the only GPU server that is required in HugeCTR?": [[0, "is-dgx-the-only-gpu-server-that-is-required-in-hugectr"]], "27. Can HugeCTR run without InfiniBand?": [[0, "id1"]], "28. Does HugeCTR support loading pretrained embeddings in other formats?": [[0, "does-hugectr-support-loading-pretrained-embeddings-in-other-formats"]], "29. How to construct the model graph with branch topology in HugeCTR?": [[0, "how-to-construct-the-model-graph-with-branch-topology-in-hugectr"]], "30. What is the good practice of configuring the embedding vector size?": [[0, "what-is-the-good-practice-of-configuring-the-embedding-vector-size"]], "31. How to resolve the bus error when running HugeCTR samples and notebooks?": [[0, "how-to-resolve-the-bus-error-when-running-hugectr-samples-and-notebooks"]], "32. What does the log \u201cmemory pool is empty\u201d imply for HugeCTR inference?": [[0, "what-does-the-log-memory-pool-is-empty-imply-for-hugectr-inference"]], "Additional Resources": [[1, "additional-resources"]], "HugeCTR Layer Classes and Methods": [[2, "hugectr-layer-classes-and-methods"]], "Input Layer": [[2, "input-layer"]], "Sparse Embedding": [[2, "sparse-embedding"]], "Embedding Types Detail": [[2, "embedding-types-detail"]], "DistributedSlotSparseEmbeddingHash Layer": [[2, "distributedslotsparseembeddinghash-layer"]], "LocalizedSlotSparseEmbeddingHash Layer": [[2, "localizedslotsparseembeddinghash-layer"]], "LocalizedSlotSparseEmbeddingOneHot Layer": [[2, "localizedslotsparseembeddingonehot-layer"]], "Dense Layers": [[2, "dense-layers"]], "Dense Layers Usage": [[2, "dense-layers-usage"]], "FullyConnected Layer": [[2, "fullyconnected-layer"]], "MLP Layer": [[2, "mlp-layer"]], "MultiCross Layer": [[2, "multicross-layer"]], "FmOrder2 Layer": [[2, "fmorder2-layer"]], "WeightMultiply Layer": [[2, "weightmultiply-layer"]], "ElementwiseMultiply Layer": [[2, "elementwisemultiply-layer"]], "BatchNorm Layer": [[2, "batchnorm-layer"]], "LayerNorm Layer": [[2, "layernorm-layer"]], "Concat Layer": [[2, "concat-layer"]], "Reshape Layer": [[2, "reshape-layer"]], "Select Layer": [[2, "select-layer"]], "Slice Layer": [[2, "slice-layer"]], "Dropout Layer": [[2, "dropout-layer"]], "ELU Layer": [[2, "elu-layer"]], "ReLU Layer": [[2, "relu-layer"]], "Sigmoid Layer": [[2, "sigmoid-layer"]], "Interaction Layer": [[2, "interaction-layer"]], "Add Layer": [[2, "add-layer"]], "ReduceSum Layer": [[2, "reducesum-layer"]], "GRU Layer": [[2, "gru-layer"]], "PReLUDice Layer": [[2, "preludice-layer"]], "Scale Layer": [[2, "scale-layer"]], "FusedReshapeConcat Layer": [[2, "fusedreshapeconcat-layer"]], "FusedReshapeConcatGeneral Layer": [[2, "fusedreshapeconcatgeneral-layer"]], "Softmax Layer": [[2, "softmax-layer"]], "Sub Layer": [[2, "sub-layer"]], "ReduceMean Layer": [[2, "reducemean-layer"]], "MatrixMutiply Layer": [[2, "matrixmutiply-layer"]], "MultiHeadAttention Layer": [[2, "multiheadattention-layer"]], "SequenceMask Layer": [[2, "sequencemask-layer"]], "Gather Layer": [[2, "gather-layer"]], "BinaryCrossEntropyLoss": [[2, "binarycrossentropyloss"]], "CrossEntropyLoss": [[2, "crossentropyloss"]], "MultiCrossEntropyLoss": [[2, "multicrossentropyloss"]], "Embedding Collection": [[2, "embedding-collection"]], "About the HugeCTR embedding collection": [[2, "about-the-hugectr-embedding-collection"]], "Overview of using the HugeCTR embedding collection": [[2, "overview-of-using-the-hugectr-embedding-collection"]], "Known Limitations": [[2, "known-limitations"]], "EmbeddingTableConfig": [[2, "embeddingtableconfig"]], "EmbeddingCollectionConfig": [[2, "embeddingcollectionconfig"]], "embedding_lookup method": [[2, "embedding-lookup-method"]], "shard method": [[2, "shard-method"]], "HugeCTR API Documentation": [[3, "hugectr-api-documentation"]], "HugeCTR Python Interface": [[4, "hugectr-python-interface"]], "About the HugeCTR Python Interface": [[4, "about-the-hugectr-python-interface"]], "High-level Training API": [[4, "high-level-training-api"]], "Solver": [[4, "solver"]], "CreateSolver method": [[4, "createsolver-method"]], "AsyncParam": [[4, "asyncparam"]], "AsyncParam class": [[4, "asyncparam-class"]], "HybridEmbeddingParam": [[4, "hybridembeddingparam"]], "HybridEmbeddingParam class": [[4, "hybridembeddingparam-class"]], "DataReaderParams": [[4, "datareaderparams"]], "DataReaderParams class": [[4, "datareaderparams-class"]], "Dataset formats": [[4, "dataset-formats"]], "Data Files": [[4, "data-files"]], "File List": [[4, "file-list"]], "Raw": [[4, "raw"]], "Parquet": [[4, "parquet"]], "OptParamsPy": [[4, "optparamspy"]], "CreateOptimizer method": [[4, "createoptimizer-method"]], "Layers": [[4, "layers"]], "Model": [[4, "model"], [4, "id2"]], "Model class": [[4, "model-class"]], "add method": [[4, "add-method"]], "compile method": [[4, "compile-method"]], "fit method": [[4, "fit-method"]], "summary method": [[4, "summary-method"]], "graph_to_json method": [[4, "graph-to-json-method"]], "construct_from_json method": [[4, "construct-from-json-method"]], "load_dense_weights method": [[4, "load-dense-weights-method"]], "load_dense_optimizer_states method": [[4, "load-dense-optimizer-states-method"]], "load_sparse_weights method": [[4, "load-sparse-weights-method"]], "load_sparse_optimizer_states method": [[4, "load-sparse-optimizer-states-method"]], "freeze_dense method": [[4, "freeze-dense-method"]], "freeze_embedding method": [[4, "freeze-embedding-method"]], "unfreeze_dense method": [[4, "unfreeze-dense-method"]], "unfreeze_embedding method": [[4, "unfreeze-embedding-method"]], "reset_learning_rate_scheduler method": [[4, "reset-learning-rate-scheduler-method"]], "set_source method": [[4, "set-source-method"], [4, "id1"]], "Low-level Training API": [[4, "low-level-training-api"]], "LearningRateScheduler": [[4, "learningratescheduler"]], "get_next method": [[4, "get-next-method"]], "DataReader": [[4, "datareader"]], "is_eof method": [[4, "is-eof-method"]], "get_learning_rate_scheduler method": [[4, "get-learning-rate-scheduler-method"]], "get_data_reader_train method": [[4, "get-data-reader-train-method"]], "get_data_reader_eval method": [[4, "get-data-reader-eval-method"]], "start_data_reading method": [[4, "start-data-reading-method"]], "set_learning_rate method": [[4, "set-learning-rate-method"]], "train method": [[4, "train-method"]], "get_current_loss method": [[4, "get-current-loss-method"]], "eval method": [[4, "eval-method"]], "get_eval_metrics method": [[4, "get-eval-metrics-method"]], "save_params_to_files method": [[4, "save-params-to-files-method"]], "check_out_tensor method": [[4, "check-out-tensor-method"], [4, "id3"]], "Inference API": [[4, "inference-api"]], "InferenceParams": [[4, "inferenceparams"]], "InferenceParams class": [[4, "inferenceparams-class"]], "InferenceModel": [[4, "inferencemodel"]], "InferenceModel class": [[4, "inferencemodel-class"]], "predict method": [[4, "predict-method"]], "evaluate method": [[4, "evaluate-method"]], "Data Generator API": [[4, "data-generator-api"]], "DataGeneratorParams class": [[4, "datageneratorparams-class"]], "DataGenerator": [[4, "datagenerator"]], "DataGenerator class": [[4, "datagenerator-class"]], "generate method": [[4, "generate-method"]], "Data Source API": [[4, "data-source-api"]], "DataSourceParams class": [[4, "datasourceparams-class"]], "Hierarchical Parameter Server Database Backend": [[5, "hierarchical-parameter-server-database-backend"]], "Introduction to the HPS Database Backend": [[5, "introduction-to-the-hps-database-backend"]], "Background": [[5, "background"]], "Architecture": [[5, "architecture"]], "Training and Iterative Model Updates": [[5, "training-and-iterative-model-updates"]], "Execution": [[5, "execution"]], "Inference": [[5, "inference"]], "Training": [[5, "training"], [53, "training"], [53, "id3"]], "Lookup Optimization": [[5, "lookup-optimization"]], "Configuration": [[5, "configuration"]], "Inference Parameters and Embedding Cache Configuration": [[5, "inference-parameters-and-embedding-cache-configuration"]], "Inference Params Syntax": [[5, "inference-params-syntax"]], "Inference Parameters": [[5, "inference-parameters"]], "Parameter Server Configuration: Models": [[5, "parameter-server-configuration-models"]], "Volatile Database Configuration": [[5, "volatile-database-configuration"]], "Volatile Database Params Syntax": [[5, "volatile-database-params-syntax"]], "Parameter Server Configuration: Volatile Database": [[5, "parameter-server-configuration-volatile-database"]], "Volatile Database Parameters": [[5, "volatile-database-parameters"]], "Overflow Parameters": [[5, "overflow-parameters"]], "Common Volatile Database Parameters": [[5, "common-volatile-database-parameters"]], "Persistent Database Configuration": [[5, "persistent-database-configuration"]], "Persistent Database Params Syntax": [[5, "persistent-database-params-syntax"]], "Parameter Server Configuration: Persistent Database": [[5, "parameter-server-configuration-persistent-database"]], "Persistent Database Parameters": [[5, "persistent-database-parameters"]], "Update Source Configuration": [[5, "update-source-configuration"]], "Update Source Params Syntax": [[5, "update-source-params-syntax"]], "Parameter Server Configuration: Update Source": [[5, "parameter-server-configuration-update-source"]], "Update Source Parameters": [[5, "update-source-parameters"]], "Benchmark the DLRM Model with HPS": [[6, "benchmark-the-dlrm-model-with-hps"]], "Benchmark Setup": [[6, "benchmark-setup"]], "Results": [[6, "results"]], "Resources": [[6, "resources"]], "Hierarchical Parameter Server API": [[7, "hierarchical-parameter-server-api"]], "HPS Initialize": [[8, "hps-initialize"]], "HPS Layers": [[9, "hps-layers"]], "SparseLookupLayer": [[9, "sparselookuplayer"]], "LookupLayer": [[9, "lookuplayer"]], "Hierarchical Parameter Server Plugin for TensorFlow": [[10, "hierarchical-parameter-server-plugin-for-tensorflow"]], "Introduction to the HPS Plugin for TensorFlow": [[10, "introduction-to-the-hps-plugin-for-tensorflow"]], "Benefits of the Plugin for TensorFlow": [[10, "benefits-of-the-plugin-for-tensorflow"]], "Workflow": [[10, "workflow"], [17, "workflow"]], "Installation": [[10, "installation"], [13, "installation"], [17, "installation"], [20, "installation"], [21, "installation"], [22, "installation"], [23, "installation"], [24, "installation"], [26, "installation"], [27, "installation"], [28, "installation"], [30, "installation"], [31, "installation"], [32, "installation"], [33, "installation"]], "Compute Capability": [[10, "compute-capability"], [13, "compute-capability"], [17, "compute-capability"], [38, "compute-capability"]], "Installing HPS Using NGC Containers": [[10, "installing-hps-using-ngc-containers"], [13, "installing-hps-using-ngc-containers"], [17, "installing-hps-using-ngc-containers"]], "Example Notebooks": [[10, "example-notebooks"], [13, "example-notebooks"], [17, "example-notebooks"]], "Benchmark": [[10, "benchmark"], [17, "benchmark"]], "HPS Plugin for Torch API": [[11, "hps-plugin-for-torch-api"]], "HPS Plugin for Torch": [[12, "hps-plugin-for-torch"]], "LookupLayer class": [[12, "lookuplayer-class"]], "Hierarchical Parameter Server Plugin for Torch": [[13, "hierarchical-parameter-server-plugin-for-torch"]], "Introduction to the HPS Plugin for Torch": [[13, "introduction-to-the-hps-plugin-for-torch"]], "HPS Plugin": [[14, "hps-plugin"]], "HPS Plugin Creator": [[15, "hps-plugin-creator"]], "HPS Plugin for TensorRT API": [[16, "hps-plugin-for-tensorrt-api"]], "Hierarchical Parameter Server Plugin for TensorRT": [[17, "hierarchical-parameter-server-plugin-for-tensorrt"]], "Introduction to the HPS Plugin for TensorRT": [[17, "introduction-to-the-hps-plugin-for-tensorrt"]], "Hierarchical Parameter Server": [[18, "hierarchical-parameter-server"], [36, "hierarchical-parameter-server"]], "Profiling HPS": [[19, "profiling-hps"]], "HPS profiler": [[19, "hps-profiler"]], "Build and install the HPS Profiler": [[19, "build-and-install-the-hps-profiler"]], "Create a synthetic embedding table": [[19, "create-a-synthetic-embedding-table"]], "Use the HPS Profiler to get the measurement results": [[19, "use-the-hps-profiler-to-get-the-measurement-results"]], "Profile HPS with Triton Perf Analyzer:": [[19, "profile-hps-with-triton-perf-analyzer"]], "HPS Profiler vs. Triton Perf Analyzer:": [[19, "hps-profiler-vs-triton-perf-analyzer"]], "Hierarchical Parameter Server Demo": [[20, "hierarchical-parameter-server-demo"], [41, "hierarchical-parameter-server-demo"]], "Overview": [[20, "overview"], [21, "overview"], [22, "overview"], [23, "overview"], [24, "overview"], [26, "overview"], [27, "overview"], [28, "overview"], [30, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [41, "overview"], [42, "overview"], [44, "overview"], [53, "overview"]], "Get HPS from NGC": [[20, "get-hps-from-ngc"], [21, "get-hps-from-ngc"], [22, "get-hps-from-ngc"], [23, "get-hps-from-ngc"], [24, "get-hps-from-ngc"], [28, "get-hps-from-ngc"]], "Configurations": [[20, "configurations"], [21, "configurations"], [22, "configurations"], [24, "configurations"], [26, "configurations"], [27, "configurations"], [32, "configurations"], [33, "configurations"]], "Train with native TF layers": [[20, "train-with-native-tf-layers"], [21, "train-with-native-tf-layers"], [22, "train-with-native-tf-layers"], [24, "train-with-native-tf-layers"], [33, "train-with-native-tf-layers"]], "Create the inference graph with HPS LookupLayer": [[20, "create-the-inference-graph-with-hps-lookuplayer"], [24, "create-the-inference-graph-with-hps-lookuplayer"]], "Inference with saved model graph": [[20, "inference-with-saved-model-graph"], [21, "inference-with-saved-model-graph"], [26, "inference-with-saved-model-graph"]], "HPS for Multiple Tables and Sparse Inputs": [[21, "hps-for-multiple-tables-and-sparse-inputs"]], "Create the inference graph with HPS SparseLookupLayer and LookupLayer": [[21, "create-the-inference-graph-with-hps-sparselookuplayer-and-lookuplayer"]], "HPS Pretrained Model Training Demo": [[22, "hps-pretrained-model-training-demo"]], "Load the pre-trained embeddings via HPS": [[22, "load-the-pre-trained-embeddings-via-hps"]], "HPS Table Fusion Demo": [[23, "hps-table-fusion-demo"]], "Create TF SavedModel": [[23, "create-tf-savedmodel"]], "Make inference with HPS table fusion": [[23, "make-inference-with-hps-table-fusion"]], "Deploy SavedModel using HPS with Triton TensorFlow Backend": [[24, "deploy-savedmodel-using-hps-with-triton-tensorflow-backend"], [24, "id1"]], "Deploy TF-TRT SavedModel using HPS with Triton TensorFlow Backend": [[24, "deploy-tf-trt-savedmodel-using-hps-with-triton-tensorflow-backend"]], "Hierarchical Parameter Server Notebooks": [[25, "hierarchical-parameter-server-notebooks"], [29, "hierarchical-parameter-server-notebooks"]], "Quickstart": [[25, "quickstart"], [29, "quickstart"], [34, "quickstart"]], "Pull the NGC Docker": [[25, "pull-the-ngc-docker"], [29, "pull-the-ngc-docker"]], "Clone the HugeCTR Repository": [[25, "clone-the-hugectr-repository"], [29, "clone-the-hugectr-repository"], [34, "clone-the-hugectr-repository"]], "Start the Jupyter Notebook": [[25, "start-the-jupyter-notebook"], [29, "start-the-jupyter-notebook"], [34, "start-the-jupyter-notebook"]], "Notebook List": [[25, "notebook-list"], [29, "notebook-list"], [34, "notebook-list"], [43, "notebook-list"]], "System Specifications": [[25, "system-specifications"], [29, "system-specifications"], [34, "system-specifications"], [43, "system-specifications"]], "SOK to HPS DLRM Demo": [[26, "sok-to-hps-dlrm-demo"]], "Get SOK from NGC": [[26, "get-sok-from-ngc"], [27, "get-sok-from-ngc"]], "Train with SOK embedding layers": [[26, "train-with-sok-embedding-layers"]], "Create the inference graph with HPS SparseLookupLayer": [[26, "create-the-inference-graph-with-hps-sparselookuplayer"]], "SOK Train DLRM Demo": [[27, "sok-train-dlrm-demo"]], "Build model with SOK embedding layers": [[27, "build-model-with-sok-embedding-layers"]], "Train with SOK models": [[27, "train-with-sok-models"]], "HPS Torch Demo": [[28, "hps-torch-demo"]], "Data Generation": [[28, "data-generation"], [31, "data-generation"], [41, "data-generation"]], "Lookup with Table Fusion": [[28, "lookup-with-table-fusion"]], "HPS TensorRT Plugin Benchmark for TensorFlow Large Model": [[30, "hps-tensorrt-plugin-benchmark-for-tensorflow-large-model"]], "Use NGC": [[30, "use-ngc"], [31, "use-ngc"], [32, "use-ngc"], [33, "use-ngc"]], "1. Create the TF model": [[30, "create-the-tf-model"]], "2. Build the HPS-integrated TensorRT engine": [[30, "build-the-hps-integrated-tensorrt-engine"]], "Step1: Prepare the 147GB embedding table": [[30, "step1-prepare-the-147gb-embedding-table"]], "1.1 Train a 147GB model from scratch": [[30, "train-a-147gb-model-from-scratch"]], "1.2 Get the embedding model file in hps format": [[30, "get-the-embedding-model-file-in-hps-format"]], "Step2: Prepare JSON configuration file for HPS": [[30, "step2-prepare-json-configuration-file-for-hps"]], "Step3: Convert to ONNX and do ONNX graph surgery": [[30, "step3-convert-to-onnx-and-do-onnx-graph-surgery"]], "Step4: Build the TensorRT engine": [[30, "step4-build-the-tensorrt-engine"]], "3. Benchmark HPS-integrated TensorRT engine on Triton": [[30, "benchmark-hps-integrated-tensorrt-engine-on-triton"]], "Step1: Create the model repository": [[30, "step1-create-the-model-repository"]], "Step2: Prepare the benchmark input data": [[30, "step2-prepare-the-benchmark-input-data"]], "Step3: Launch the Triton inference server": [[30, "step3-launch-the-triton-inference-server"]], "Step4: Run the benchmark": [[30, "step4-run-the-benchmark"]], "4. Benchmark for ARM64 or Grace + Hooper systems": [[30, "benchmark-for-arm64-or-grace-hooper-systems"]], "Step 1: Build the NVIDIA Merlin docker images": [[30, "step-1-build-the-nvidia-merlin-docker-images"]], "Step 2: Prepare host system for running the docker container": [[30, "step-2-prepare-host-system-for-running-the-docker-container"]], "Step 3: Create the model": [[30, "step-3-create-the-model"]], "Step 4: Prepare data": [[30, "step-4-prepare-data"]], "Step 5: Run benchmark": [[30, "step-5-run-benchmark"]], "HPS TensorRT Plugin Demo for HugeCTR Trained Model": [[31, "hps-tensorrt-plugin-demo-for-hugectr-trained-model"]], "Train with HugeCTR": [[31, "train-with-hugectr"]], "Build the HPS-integrated TensorRT engine": [[31, "build-the-hps-integrated-tensorrt-engine"], [32, "build-the-hps-integrated-tensorrt-engine"], [33, "build-the-hps-integrated-tensorrt-engine"]], "Step1: Prepare JSON configuration file for HPS": [[31, "step1-prepare-json-configuration-file-for-hps"]], "Step2: Convert to ONNX and do ONNX graph surgery": [[31, "step2-convert-to-onnx-and-do-onnx-graph-surgery"], [32, "step2-convert-to-onnx-and-do-onnx-graph-surgery"], [33, "step2-convert-to-onnx-and-do-onnx-graph-surgery"]], "Step3: Build the TensorRT engine": [[31, "step3-build-the-tensorrt-engine"], [32, "step3-build-the-tensorrt-engine"], [33, "step3-build-the-tensorrt-engine"]], "Deploy HPS-integrated TensorRT engine on Triton": [[31, "deploy-hps-integrated-tensorrt-engine-on-triton"], [32, "deploy-hps-integrated-tensorrt-engine-on-triton"]], "HPS TensorRT Plugin Demo for PyTorch Trained Model": [[32, "hps-tensorrt-plugin-demo-for-pytorch-trained-model"]], "Train with PyTorch": [[32, "train-with-pytorch"]], "Step1: Prepare sparse model and JSON configuration file for HPS": [[32, "step1-prepare-sparse-model-and-json-configuration-file-for-hps"], [33, "step1-prepare-sparse-model-and-json-configuration-file-for-hps"]], "HPS TensorRT Plugin Demo for TensorFlow Trained Model": [[33, "hps-tensorrt-plugin-demo-for-tensorflow-trained-model"]], "Deploy HPS-integrated TensorRT engine with Triton on multiple GPUs": [[33, "deploy-hps-integrated-tensorrt-engine-with-triton-on-multiple-gpus"]], "HPS Plugin for TensorRT Notebooks": [[34, "hps-plugin-for-tensorrt-notebooks"]], "Pull the Container from NGC": [[34, "pull-the-container-from-ngc"]], "Contributing to HugeCTR": [[35, "contributing-to-hugectr"]], "Overview of Contributing to HugeCTR": [[35, "overview-of-contributing-to-hugectr"]], "Contribute New Code": [[35, "contribute-new-code"]], "How to Start your Development": [[35, "how-to-start-your-development"]], "Set Up the Development Environment With Merlin Containers": [[35, "set-up-the-development-environment-with-merlin-containers"]], "Build HugeCTR Training Container from Source": [[35, "build-hugectr-training-container-from-source"]], "Build HugeCTR Inference Container from Source": [[35, "build-hugectr-inference-container-from-source"]], "Build Sparse Operation Kit (SOK) from Source": [[35, "build-sparse-operation-kit-sok-from-source"]], "HugeCTR Core Features": [[36, "hugectr-core-features"]], "Summary of Core Features": [[36, "summary-of-core-features"]], "Model Parallel Training": [[36, "model-parallel-training"]], "Multi-Node Training": [[36, "multi-node-training"]], "Mixed Precision Training": [[36, "mixed-precision-training"]], "SGD Optimizer and Learning Rate Scheduling": [[36, "sgd-optimizer-and-learning-rate-scheduling"]], "HugeCTR to ONNX Converter": [[36, "hugectr-to-onnx-converter"]], "HDFS Support": [[36, "hdfs-support"]], "Sparse Operation Kit": [[36, "sparse-operation-kit"], [56, "sparse-operation-kit"]], "HugeCTR Talks and Blogs": [[37, "hugectr-talks-and-blogs"]], "Talks": [[37, "talks"]], "Blogs": [[37, "blogs"]], "Introduction to HugeCTR": [[38, "introduction-to-hugectr"]], "About HugeCTR": [[38, "about-hugectr"]], "Installing and Building HugeCTR": [[38, "installing-and-building-hugectr"]], "Installing HugeCTR Using NGC Containers": [[38, "installing-hugectr-using-ngc-containers"]], "Building HugeCTR from Scratch": [[38, "building-hugectr-from-scratch"]], "Tools": [[38, "tools"]], "Generating Synthetic Data and Benchmarks": [[38, "generating-synthetic-data-and-benchmarks"]], "Downloading and Preprocessing Datasets": [[38, "downloading-and-preprocessing-datasets"]], "Merlin HugeCTR": [[39, "merlin-hugectr"]], "Related Resources": [[39, "related-resources"]], "HugeCTR Embedding Collection": [[40, "hugectr-embedding-collection"]], "About this Notebook": [[40, "about-this-notebook"]], "Concepts and API Reference": [[40, "concepts-and-api-reference"]], "Setup": [[40, "setup"], [41, "setup"], [42, "setup"]], "Use an Embedding Collection with a DLRM Model": [[40, "use-an-embedding-collection-with-a-dlrm-model"]], "Data Preparation": [[40, "data-preparation"], [42, "data-preparation"], [53, "data-preparation"]], "Run the following commands on the terminal to prepare the data for this notebook": [[40, "run-the-following-commands-on-the-terminal-to-prepare-the-data-for-this-notebook"]], "Prepare the Training Script": [[40, "prepare-the-training-script"]], "Embedding Table Placement Strategy: Round Robin": [[40, "embedding-table-placement-strategy-round-robin"]], "Embedding Table Placement Strategy: Uniform": [[40, "embedding-table-placement-strategy-uniform"]], "Embedding Table Placement Strategy: Hybrid": [[40, "embedding-table-placement-strategy-hybrid"]], "Use Dynamic Hash Table with Round Robin Table Placement Strategy": [[40, "use-dynamic-hash-table-with-round-robin-table-placement-strategy"]], "Train from Scratch": [[41, "train-from-scratch"]], "Convert HugeCTR to ONNX": [[41, "convert-hugectr-to-onnx"]], "1. Inference with HPS & ONNX": [[41, "inference-with-hps-onnx"]], "2. Lookup the Embedding Vector from DLPack": [[41, "lookup-the-embedding-vector-from-dlpack"]], "3. Multi-process inference": [[41, "multi-process-inference"]], "4. Redis Cluster deployment (without TLS/SSL)": [[41, "redis-cluster-deployment-without-tls-ssl"]], "5. Redis Cluster deployment (with TLS/SSL)": [[41, "redis-cluster-deployment-with-tls-ssl"]], "HugeCTR End-end Example with NVTabular": [[42, "hugectr-end-end-example-with-nvtabular"]], "Data Preprocessing using NVTabular": [[42, "data-preprocessing-using-nvtabular"]], "Training a WDL model with HugeCTR": [[42, "training-a-wdl-model-with-hugectr"]], "HugeCTR Example Notebooks": [[43, "hugectr-example-notebooks"]], "1. Clone the HugeCTR Repository": [[43, "clone-the-hugectr-repository"]], "2. Pull the NGC Docker and run it": [[43, "pull-the-ngc-docker-and-run-it"]], "3. Customized Building (Optional)": [[43, "customized-building-optional"]], "4. Start the Jupyter Notebook": [[43, "start-the-jupyter-notebook"]], "Training Recommender Systems on Multi-modal Data": [[44, "training-recommender-systems-on-multi-modal-data"]], "MovieLens-25M: Download and Convert": [[45, "movielens-25m-download-and-convert"]], "Getting Started": [[45, "getting-started"]], "Convert the dataset": [[45, "convert-the-dataset"]], "Splitting into train and validation dataset": [[45, "splitting-into-train-and-validation-dataset"]], "Next steps": [[45, "next-steps"]], "MovieLens Data Enrichment": [[46, "movielens-data-enrichment"]], "Scraping data from IMDB": [[46, "scraping-data-from-imdb"]], "Collect synopsis for all movies": [[46, "collect-synopsis-for-all-movies"]], "Scraping movie posters": [[46, "scraping-movie-posters"]], "Movie Poster Feature Extraction with ResNet": [[47, "movie-poster-feature-extraction-with-resnet"]], "Download a pretrained ResNet-50 from NVIDIA GPU cloud": [[47, "download-a-pretrained-resnet-50-from-nvidia-gpu-cloud"]], "Extract features for all movies": [[47, "extract-features-for-all-movies"]], "Movie Synopsis Feature Extraction with Bart text summarization": [[48, "movie-synopsis-feature-extraction-with-bart-text-summarization"]], "Download pretrained BART model": [[48, "download-pretrained-bart-model"]], "Extracting embeddings for all movie\u2019s synopsis": [[48, "extracting-embeddings-for-all-movie-s-synopsis"]], "Creating Multi-Modal Movie Feature Store": [[49, "creating-multi-modal-movie-feature-store"]], "Real data": [[49, "real-data"]], "Synthetic data": [[49, "synthetic-data"]], "ETL with NVTabular": [[50, "etl-with-nvtabular"]], "Defining our Preprocessing Pipeline": [[50, "defining-our-preprocessing-pipeline"]], "Running the pipeline": [[50, "running-the-pipeline"]], "Checking the pre-processing outputs": [[50, "checking-the-pre-processing-outputs"]], "Training HugeCTR Model with Pre-trained Embeddings": [[51, "training-hugectr-model-with-pre-trained-embeddings"]], "Loading pretrained movie features into non-trainable embedding layer": [[51, "loading-pretrained-movie-features-into-non-trainable-embedding-layer"]], "Define and train model": [[51, "define-and-train-model"]], "Multi-modal Example Notebooks": [[52, "multi-modal-example-notebooks"]], "HugeCTR Training with Remote File System Example": [[53, "hugectr-training-with-remote-file-system-example"]], "Setup HugeCTR": [[53, "setup-hugectr"]], "Training with HDFS Example": [[53, "training-with-hdfs-example"]], "Training a DLRM model": [[53, "training-a-dlrm-model"]], "Training a DCN model with AWS S3": [[53, "training-a-dcn-model-with-aws-s3"]], "Data preparation": [[53, "id1"], [53, "id2"]], "Training a DCN model with Google Cloud Storage": [[53, "training-a-dcn-model-with-google-cloud-storage"]], "Performance": [[54, "performance"]], "MLPerf on DGX-2 and DGX A100": [[54, "mlperf-on-dgx-2-and-dgx-a100"]], "Evaluating HugeCTR\u2019s Performance on the DGX-1": [[54, "evaluating-hugectr-s-performance-on-the-dgx-1"]], "Evaluating HugeCTR\u2019s Performance on TensorFlow": [[54, "evaluating-hugectr-s-performance-on-tensorflow"]], "Release Notes": [[55, "release-notes"]], "What\u2019s New in Version 24.06": [[55, "what-s-new-in-version-24-06"]], "What\u2019s New in Version 23.12": [[55, "what-s-new-in-version-23-12"]], "What\u2019s New in Version 23.11": [[55, "what-s-new-in-version-23-11"]], "What\u2019s New in Version 23.08": [[55, "what-s-new-in-version-23-08"]], "What\u2019s New in Version 23.06": [[55, "what-s-new-in-version-23-06"]], "What\u2019s New in Version 23.04": [[55, "what-s-new-in-version-23-04"]], "What\u2019s New in Version 23.02": [[55, "what-s-new-in-version-23-02"]], "What\u2019s New in Version 4.3": [[55, "what-s-new-in-version-4-3"]], "What\u2019s New in Version 4.2": [[55, "what-s-new-in-version-4-2"]], "What\u2019s New in Version 4.1": [[55, "what-s-new-in-version-4-1"]], "What\u2019s New in Version 4.0": [[55, "what-s-new-in-version-4-0"]], "What\u2019s New in Version 3.9": [[55, "what-s-new-in-version-3-9"]], "What\u2019s New in Version 3.8": [[55, "what-s-new-in-version-3-8"]], "What\u2019s New in Version 3.7": [[55, "what-s-new-in-version-3-7"]], "What\u2019s New in Version 3.6": [[55, "what-s-new-in-version-3-6"]], "What\u2019s New in Version 3.5": [[55, "what-s-new-in-version-3-5"]], "What\u2019s New in Version 3.4.1": [[55, "what-s-new-in-version-3-4-1"]], "What\u2019s New in Version 3.4": [[55, "what-s-new-in-version-3-4"]], "What\u2019s New in Version 3.3.1": [[55, "what-s-new-in-version-3-3-1"]], "What\u2019s New in Version 3.3": [[55, "what-s-new-in-version-3-3"]], "What\u2019s New in Version 3.2.1": [[55, "what-s-new-in-version-3-2-1"]], "What\u2019s New in Version 3.2": [[55, "what-s-new-in-version-3-2"]], "What\u2019s New in Version 3.1": [[55, "what-s-new-in-version-3-1"]], "What\u2019s New in Version 3.0.1": [[55, "what-s-new-in-version-3-0-1"]], "What\u2019s New in Version 3.0": [[55, "whats-new-in-version-3-0"]], "What\u2019s New in Version 2.3": [[55, "what-s-new-in-version-2-3"]], "Known Issues": [[55, "known-issues"]]}, "indexentries": {"init() (in module hierarchical_parameter_server)": [[8, "hierarchical_parameter_server.Init"]], "lookuplayer (class in hierarchical_parameter_server)": [[9, "hierarchical_parameter_server.LookupLayer"]], "sparselookuplayer (class in hierarchical_parameter_server)": [[9, "hierarchical_parameter_server.SparseLookupLayer"]], "call() (hierarchical_parameter_server.lookuplayer method)": [[9, "hierarchical_parameter_server.LookupLayer.call"]], "call() (hierarchical_parameter_server.sparselookuplayer method)": [[9, "hierarchical_parameter_server.SparseLookupLayer.call"]]}})
\ No newline at end of file