Skip to content

Commit

Permalink
minor tutorial updates
Browse files Browse the repository at this point in the history
Signed-off-by: Sarah Yurick <[email protected]>
  • Loading branch information
sarahyurick committed Feb 13, 2025
1 parent 7d006e8 commit 85133a2
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -1804,7 +1804,7 @@
"components_stage = ConnectedComponents(\n",
" cache_dir=cache_dir,\n",
" jaccard_pairs_path=edgelist_path,\n",
-" id_column=id_field,\n",
+" id_field=id_field,\n",
")\n",
"components_stage.cc_workflow(output_path=output_path)\n",
"print(f\"Connected Component took {time.time()-t0} seconds\")"
Expand Down
6 changes: 3 additions & 3 deletions tutorials/single_node_tutorial/single_gpu_tutorial.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -1338,7 +1338,7 @@
"t0 = time.time()\n",
"print(f\"Computing minhashes for {minhash_data_path}\")\n",
"\n",
-"# Load data. Only the [minhash_id_field, text_field] columns are needed\n",
+"# Load data. Only the [minhash_id_field, minhash_text_field] columns are needed\n",
"files = get_all_files_paths_under(root=minhash_data_path, recurse_subdirectories=False)\n",
"files = [f for f in files if f.endswith(\".jsonl\")]\n",
"df = read_data(\n",
Expand Down Expand Up @@ -1597,7 +1597,7 @@
"ddf_bk = DocumentDataset.read_parquet(input_bucket_path, backend=\"cudf\")\n",
"\n",
"#Run _MapBuckets()\n",
-"buckets_to_edges = BucketsToEdges(cache_dir=edgelist_output_dir, id_fields=input_id_field, logger=buckets_to_edges_log_path)\n",
+"buckets_to_edges = BucketsToEdges(cache_dir=edgelist_output_dir, id_fields=id_field, logger=buckets_to_edges_log_path)\n",
"res = buckets_to_edges(ddf_bk)\n",
"\n",
"print(f\"Time taken for Bucket->Edgelist:{time.time()-t0} s\")"
Expand Down Expand Up @@ -1750,7 +1750,7 @@
},
"outputs": [],
"source": [
-"# cc_compute_res.groupby('group')[input_id_field].agg(list).reset_index()"
+"# cc_compute_res.groupby('group')[id_field].agg(list).reset_index()"
]
},
{
Expand Down

0 comments on commit 85133a2

Please sign in to comment.