From a21ec4f5c28cb45b13dc2cc64f6bca7701f4708e Mon Sep 17 00:00:00 2001 From: Hemil Desai Date: Mon, 14 Oct 2024 15:36:33 -0700 Subject: [PATCH] Fix HOST_DATA_PATH and kernel metadata in slimpajama data_pipeline notebook Signed-off-by: Hemil Desai --- examples/llm/slimpajama/data_pipeline.ipynb | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/examples/llm/slimpajama/data_pipeline.ipynb b/examples/llm/slimpajama/data_pipeline.ipynb index e1da6b50cf9c6..d59fbbd4685f2 100644 --- a/examples/llm/slimpajama/data_pipeline.ipynb +++ b/examples/llm/slimpajama/data_pipeline.ipynb @@ -36,7 +36,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -46,7 +46,7 @@ "from data.extract import run_extraction\n", "from data.preprocess import preprocess_data\n", "\n", - "HOST_DATA_PATH = \"/home/hemild/dev/data\"" + "HOST_DATA_PATH = \"/data\"" ] }, { @@ -225,9 +225,18 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 3, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "concatenated_chunk1.jsonl_text_document.bin\n", + "concatenated_chunk1.jsonl_text_document.idx\n" + ] + } + ], "source": [ "!ls {HOST_DATA_PATH}/slimpajama_megatron" ] @@ -297,7 +306,7 @@ ], "metadata": { "kernelspec": { - "display_name": ".venv", + "display_name": "Python 3", "language": "python", "name": "python3" }, @@ -311,7 +320,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.3" + "version": "3.10.12" } }, "nbformat": 4,