|
|
|
@ -692,11 +692,11 @@
|
|
|
|
|
"print(text_ML[:1000])"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "_jiTo03-VchL",
|
|
|
|
|
"outputId": "417c3854-fa28-470f-80ab-f7682ad44264",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/"
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "_jiTo03-VchL",
|
|
|
|
|
"outputId": "417c3854-fa28-470f-80ab-f7682ad44264"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 53,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -791,12 +791,12 @@
|
|
|
|
|
"plot(res_ML)"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "l7e2KaN8WMBr",
|
|
|
|
|
"outputId": "19e1dc73-b6e0-4b68-b614-2065b898f582",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 588
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "l7e2KaN8WMBr",
|
|
|
|
|
"outputId": "19e1dc73-b6e0-4b68-b614-2065b898f582"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 61,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -820,12 +820,12 @@
|
|
|
|
|
"plt.imshow(wc.generate_from_frequencies({ k:v for k,v in res_BD }))"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "S-hEf6AJWm9j",
|
|
|
|
|
"outputId": "3a7c276b-4284-4eaa-ee73-2a0e204e4af6",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 621
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "S-hEf6AJWm9j",
|
|
|
|
|
"outputId": "3a7c276b-4284-4eaa-ee73-2a0e204e4af6"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 63,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -859,12 +859,12 @@
|
|
|
|
|
"plt.imshow(wc.generate_from_frequencies({ k:v for k,v in res_ML }))"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "SwMYEEsDWxh_",
|
|
|
|
|
"outputId": "78c8a028-5e0e-4cf3-ca56-663c42ac30c8",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 621
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "SwMYEEsDWxh_",
|
|
|
|
|
"outputId": "78c8a028-5e0e-4cf3-ca56-663c42ac30c8"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 64,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -897,12 +897,12 @@
|
|
|
|
|
"plt.imshow(wc.generate(text_BD))"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "Ls1MkYJKXBa1",
|
|
|
|
|
"outputId": "5e5978c9-b76b-454e-eb43-6dce3024d245",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 621
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "Ls1MkYJKXBa1",
|
|
|
|
|
"outputId": "5e5978c9-b76b-454e-eb43-6dce3024d245"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 66,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -935,12 +935,12 @@
|
|
|
|
|
"plt.imshow(wc.generate(text_ML))"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "hdAGVczAXJfv",
|
|
|
|
|
"outputId": "e2c9e5ce-0e67-47e8-8935-54465ced6937",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 621
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"id": "hdAGVczAXJfv",
|
|
|
|
|
"outputId": "e2c9e5ce-0e67-47e8-8935-54465ced6937"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 67,
|
|
|
|
|
"outputs": [
|
|
|
|
@ -972,29 +972,10 @@
|
|
|
|
|
"wc.generate(text_BD).to_file('images/ds_wordcloud_bigdata.png')"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"id": "sqCorFXIXWPt",
|
|
|
|
|
"outputId": "2e3da5e8-1588-4f02-bf9a-b10109f024f1",
|
|
|
|
|
"colab": {
|
|
|
|
|
"base_uri": "https://localhost:8080/",
|
|
|
|
|
"height": 322
|
|
|
|
|
}
|
|
|
|
|
"id": "sqCorFXIXWPt"
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 69,
|
|
|
|
|
"outputs": [
|
|
|
|
|
{
|
|
|
|
|
"output_type": "error",
|
|
|
|
|
"ename": "FileNotFoundError",
|
|
|
|
|
"evalue": "ignored",
|
|
|
|
|
"traceback": [
|
|
|
|
|
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
|
|
|
|
"\u001b[0;31mFileNotFoundError\u001b[0m Traceback (most recent call last)",
|
|
|
|
|
"\u001b[0;32m<ipython-input-69-4b0bc35d4a5d>\u001b[0m in \u001b[0;36m<cell line: 1>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mwc\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgenerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtext_BD\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_file\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'images/ds_wordcloud_bigdata.png'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
|
|
|
|
|
"\u001b[0;32m/usr/local/lib/python3.10/dist-packages/wordcloud/wordcloud.py\u001b[0m in \u001b[0;36mto_file\u001b[0;34m(self, filename)\u001b[0m\n\u001b[1;32m 724\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 725\u001b[0m \u001b[0mimg\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_image\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 726\u001b[0;31m \u001b[0mimg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msave\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfilename\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0moptimize\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 727\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 728\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
|
|
|
|
|
"\u001b[0;32m/usr/local/lib/python3.10/dist-packages/PIL/Image.py\u001b[0m in \u001b[0;36msave\u001b[0;34m(self, fp, format, **params)\u001b[0m\n\u001b[1;32m 2426\u001b[0m \u001b[0mfp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mbuiltins\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mopen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfilename\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"r+b\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2427\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2428\u001b[0;31m \u001b[0mfp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mbuiltins\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mopen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfilename\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"w+b\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2429\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2430\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
|
|
|
|
|
"\u001b[0;31mFileNotFoundError\u001b[0m: [Errno 2] No such file or directory: 'images/ds_wordcloud_bigdata.png'"
|
|
|
|
|
]
|
|
|
|
|
}
|
|
|
|
|
]
|
|
|
|
|
"execution_count": null,
|
|
|
|
|
"outputs": []
|
|
|
|
|
},
|
|
|
|
|
{
|
|
|
|
|
"cell_type": "code",
|
|
|
|
|