Skip to content

Commit 4d408c9

Browse files
author
iamchiragsharma
committed
Updated Readme
1 parent 509bf9a commit 4d408c9

File tree

4 files changed

+233
-60
lines changed

4 files changed

+233
-60
lines changed
+2
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,2 @@
1+
# Python For Insanes
2+
Okay, threading is tough, but you know what's tougher? Controlling the threads.

Probabilistic DS/.ipynb_checkpoints/Count Min Sketch-checkpoint.ipynb

+111-29
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@
1313
},
1414
{
1515
"cell_type": "code",
16-
"execution_count": 107,
16+
"execution_count": 1,
1717
"metadata": {},
1818
"outputs": [],
1919
"source": [
@@ -25,7 +25,7 @@
2525
},
2626
{
2727
"cell_type": "code",
28-
"execution_count": 146,
28+
"execution_count": 50,
2929
"metadata": {},
3030
"outputs": [],
3131
"source": [
@@ -34,7 +34,7 @@
3434
},
3535
{
3636
"cell_type": "code",
37-
"execution_count": 116,
37+
"execution_count": 51,
3838
"metadata": {},
3939
"outputs": [],
4040
"source": [
@@ -43,7 +43,7 @@
4343
},
4444
{
4545
"cell_type": "code",
46-
"execution_count": 117,
46+
"execution_count": 52,
4747
"metadata": {},
4848
"outputs": [],
4949
"source": [
@@ -53,7 +53,7 @@
5353
},
5454
{
5555
"cell_type": "code",
56-
"execution_count": 118,
56+
"execution_count": 53,
5757
"metadata": {},
5858
"outputs": [],
5959
"source": [
@@ -62,7 +62,7 @@
6262
},
6363
{
6464
"cell_type": "code",
65-
"execution_count": 119,
65+
"execution_count": 54,
6666
"metadata": {},
6767
"outputs": [],
6868
"source": [
@@ -75,7 +75,7 @@
7575
},
7676
{
7777
"cell_type": "code",
78-
"execution_count": 120,
78+
"execution_count": 55,
7979
"metadata": {},
8080
"outputs": [],
8181
"source": [
@@ -84,7 +84,7 @@
8484
},
8585
{
8686
"cell_type": "code",
87-
"execution_count": 121,
87+
"execution_count": 56,
8888
"metadata": {},
8989
"outputs": [],
9090
"source": [
@@ -93,7 +93,7 @@
9393
},
9494
{
9595
"cell_type": "code",
96-
"execution_count": 131,
96+
"execution_count": 57,
9797
"metadata": {},
9898
"outputs": [],
9999
"source": [
@@ -102,7 +102,7 @@
102102
},
103103
{
104104
"cell_type": "code",
105-
"execution_count": 134,
105+
"execution_count": 58,
106106
"metadata": {},
107107
"outputs": [
108108
{
@@ -111,7 +111,7 @@
111111
"('', 80026)"
112112
]
113113
},
114-
"execution_count": 134,
114+
"execution_count": 58,
115115
"metadata": {},
116116
"output_type": "execute_result"
117117
}
@@ -122,44 +122,104 @@
122122
},
123123
{
124124
"cell_type": "code",
125-
"execution_count": null,
125+
"execution_count": 59,
126126
"metadata": {},
127-
"outputs": [],
127+
"outputs": [
128+
{
129+
"data": {
130+
"text/plain": [
131+
"[('the', 34254),\n",
132+
" ('and', 21799),\n",
133+
" ('to', 16569),\n",
134+
" ('of', 14941),\n",
135+
" ('a', 10395),\n",
136+
" ('he', 9574),\n",
137+
" ('in', 8844),\n",
138+
" ('his', 7949),\n",
139+
" ('that', 7589),\n",
140+
" ('was', 7297),\n",
141+
" ('with', 5667),\n",
142+
" ('had', 5348),\n",
143+
" ('it', 4653),\n",
144+
" ('her', 4587),\n",
145+
" ('not', 4571),\n",
146+
" ('at', 4503),\n",
147+
" ('him', 4294),\n",
148+
" ('as', 3913),\n",
149+
" ('on', 3879),\n",
150+
" ('but', 3664),\n",
151+
" ('for', 3426),\n",
152+
" ('she', 3316),\n",
153+
" ('i', 3246),\n",
154+
" ('is', 3165),\n",
155+
" ('you', 2988),\n",
156+
" ('said', 2757),\n",
157+
" ('from', 2670),\n",
158+
" ('all', 2641),\n",
159+
" ('were', 2401),\n",
160+
" ('be', 2386)]"
161+
]
162+
},
163+
"execution_count": 59,
164+
"metadata": {},
165+
"output_type": "execute_result"
166+
}
167+
],
128168
"source": []
129169
},
130170
{
131171
"cell_type": "code",
132-
"execution_count": 136,
172+
"execution_count": 13,
133173
"metadata": {},
134174
"outputs": [],
135-
"source": [
136-
"dataPoints = [d[0] for d in dataCounter]"
137-
]
175+
"source": []
138176
},
139177
{
140178
"cell_type": "code",
141-
"execution_count": 153,
179+
"execution_count": 60,
142180
"metadata": {},
143181
"outputs": [],
144182
"source": [
145183
"def hash_table_creator():\n",
146-
" global dataPoints,count_sketch\n",
184+
" global dataCounter,count_sketch\n",
147185
" hash42 = np.array(list(map(lambda x: mmh3.hash(x,42,signed=False),dataPoints)))\n",
148186
" hash142 = np.array(list(map(lambda x: mmh3.hash(x,142,signed=False),dataPoints)))\n",
149187
" hash1421 = np.array(list(map(lambda x: mmh3.hash(x,1421,signed=False),dataPoints)))\n",
150188
" hash14214 = np.array(list(map(lambda x: mmh3.hash(x,14214,signed=False),dataPoints)))\n",
151189
" hash142142 = np.array(list(map(lambda x: mmh3.hash(x,142142,signed=False),dataPoints)))\n",
152-
" for i in range(len(dataPoints)):\n",
153-
" count_sketch[hash42%100333][0] = hash42[i]\n",
154-
" count_sketch[hash142%100333][1] = hash142[i]\n",
155-
" count_sketch[hash1421%100333][2] = hash1421[i]\n",
156-
" count_sketch[hash14214%100333][3] = hash14214[i]\n",
157-
" count_sketch[hash142142%100333][4] = hash142142[i]"
190+
" for i in range(len(dataCounter)):\n",
191+
" count_sketch[hash42[i]%100333][0] = dataCounter[i][1]\n",
192+
" count_sketch[hash142[i]%100333][1] = dataCounter[i][1]\n",
193+
" count_sketch[hash1421[i]%100333][2] = dataCounter[i][1]\n",
194+
" count_sketch[hash14214[i]%100333][3] = dataCounter[i][1]\n",
195+
" count_sketch[hash142142[i]%100333][4] = dataCounter[i][1]"
158196
]
159197
},
160198
{
161199
"cell_type": "code",
162-
"execution_count": 154,
200+
"execution_count": 61,
201+
"metadata": {},
202+
"outputs": [],
203+
"source": [
204+
"def hash_table_finder(dataPoint):\n",
205+
" global count_sketch\n",
206+
" counting = []\n",
207+
" hash42 = mmh3.hash(dataPoint,42,signed=False)\n",
208+
" hash142 = mmh3.hash(dataPoint,142,signed=False)\n",
209+
" hash1421 = mmh3.hash(dataPoint,1421,signed=False)\n",
210+
" hash14214 = mmh3.hash(dataPoint,14214,signed=False)\n",
211+
" hash142142 = mmh3.hash(dataPoint,142142,signed=False)\n",
212+
" counting.append(count_sketch[hash42%100333][0])\n",
213+
" counting.append(count_sketch[hash142%100333][1])\n",
214+
" counting.append(count_sketch[hash1421%100333][2])\n",
215+
" counting.append(count_sketch[hash14214%100333][3])\n",
216+
" counting.append(count_sketch[hash142142%100333][4])\n",
217+
" return counting"
218+
]
219+
},
220+
{
221+
"cell_type": "code",
222+
"execution_count": 62,
163223
"metadata": {},
164224
"outputs": [],
165225
"source": [
@@ -168,7 +228,7 @@
168228
},
169229
{
170230
"cell_type": "code",
171-
"execution_count": 157,
231+
"execution_count": 63,
172232
"metadata": {},
173233
"outputs": [
174234
{
@@ -183,12 +243,34 @@
183243
" [0, 0, 0, 0, 0]], dtype=int8)"
184244
]
185245
},
186-
"execution_count": 157,
246+
"execution_count": 63,
187247
"metadata": {},
188248
"output_type": "execute_result"
189249
}
190250
],
191-
"source": []
251+
"source": [
252+
"count_sketch"
253+
]
254+
},
255+
{
256+
"cell_type": "code",
257+
"execution_count": 64,
258+
"metadata": {},
259+
"outputs": [
260+
{
261+
"data": {
262+
"text/plain": [
263+
"[-84, 29, -84, -84, -84]"
264+
]
265+
},
266+
"execution_count": 64,
267+
"metadata": {},
268+
"output_type": "execute_result"
269+
}
270+
],
271+
"source": [
272+
"hash_table_finder(\"you\")"
273+
]
192274
},
193275
{
194276
"cell_type": "code",

0 commit comments

Comments
 (0)