Upload PatentBERT_conversion.ipynb
Browse files
PatentBERT_conversion.ipynb
CHANGED
|
@@ -856,7 +856,7 @@
|
|
| 856 |
},
|
| 857 |
{
|
| 858 |
"cell_type": "code",
|
| 859 |
-
"execution_count":
|
| 860 |
"metadata": {},
|
| 861 |
"outputs": [
|
| 862 |
{
|
|
@@ -912,7 +912,7 @@
|
|
| 912 |
"import os\n",
|
| 913 |
"\n",
|
| 914 |
"# Load the real CPC labels\n",
|
| 915 |
-
"label_file_path = \"
|
| 916 |
"cpc_df = pd.read_csv(label_file_path, sep='\\t')\n",
|
| 917 |
"\n",
|
| 918 |
"print(f\"✅ Loaded {len(cpc_df)} real CPC labels from PatentBERT\")\n",
|
|
|
|
| 856 |
},
|
| 857 |
{
|
| 858 |
"cell_type": "code",
|
| 859 |
+
"execution_count": null,
|
| 860 |
"metadata": {},
|
| 861 |
"outputs": [
|
| 862 |
{
|
|
|
|
| 912 |
"import os\n",
|
| 913 |
"\n",
|
| 914 |
"# Load the real CPC labels\n",
|
| 915 |
+
"label_file_path = \"./labels_group_id.tsv\"\n",
|
| 916 |
"cpc_df = pd.read_csv(label_file_path, sep='\\t')\n",
|
| 917 |
"\n",
|
| 918 |
"print(f\"✅ Loaded {len(cpc_df)} real CPC labels from PatentBERT\")\n",
|