Práctica 3 del parcial 2

parent 369ad78c
{
"cells": [
{
"cell_type": "code",
"execution_count": 124,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"import re\n",
"from operator import itemgetter\n",
"\n",
"import matplotlib.pyplot as plt\n",
"import numpy as np\n",
"\n",
"# Count how often each word occurs in the corpus file and plot the\n",
"# distribution of those counts.\n",
"DATA_PATH = 'data/data_named_entity_recognition_sp_MX_locations.JSON'\n",
"\n",
"# A word is one ASCII letter followed by 2-9 lowercase ASCII letters,\n",
"# delimited by word boundaries (3-10 characters in total). The boundaries\n",
"# must be written as backslash-b inside a raw string; a bare 'b' would only\n",
"# match fragments that start and end with the letter b.\n",
"WORD_PATTERN = r'\\b[A-Za-z][a-z]{2,9}\\b'\n",
"\n",
"# The context manager closes the file handle even if reading fails.\n",
"# NOTE(review): UTF-8 is assumed because JSON text is UTF-8 by specification;\n",
"# confirm against the actual data file.\n",
"with open(DATA_PATH, 'r', encoding='utf-8') as open_file:\n",
"    file_to_string = open_file.read()\n",
"\n",
"words = re.findall(WORD_PATTERN, file_to_string)\n",
"\n",
"# word -> number of occurrences\n",
"frequency = {}\n",
"for word in words:\n",
"    frequency[word] = frequency.get(word, 0) + 1\n",
"\n",
"# (word, count) pairs ordered from most to least frequent.\n",
"values = sorted(frequency.items(), key=itemgetter(1), reverse=True)\n",
"\n",
"# Only the counts are plotted. Build the array in one step, which keeps the\n",
"# counts numeric and does not rely on any variable defined outside this cell.\n",
"x = np.array([count for _, count in values], dtype=int)\n",
"\n",
"# the histogram of the data; plt.hist returns (n, bins, patches)\n",
"patches = plt.hist(x, density=True, facecolor='g', alpha=0.75)\n",
"\n",
"plt.xlabel('X')\n",
"plt.ylabel('Y')\n",
"plt.title('La ley de Zipf')\n",
"\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.7"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment