diff --git a/notebooks/01. data_collect/get_repos_data.ipynb b/notebooks/01. data_collect/get_repos_data.ipynb index 75cd841..05bda4a 100644 --- a/notebooks/01. data_collect/get_repos_data.ipynb +++ b/notebooks/01. data_collect/get_repos_data.ipynb @@ -22,7 +22,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 4, "id": "3cad27e9", "metadata": {}, "outputs": [], @@ -30,7 +30,9 @@ "# Load environment variables from .env file\n", "load_dotenv()\n", "\n", - "dir_name = os.getenv('DIR_NAME')" + "dir_name = os.getenv('DIR_NAME')\n", + "base_path = f'../../data/processed/{dir_name}'\n", + "os.makedirs(base_path, exist_ok=True)" ] }, { @@ -124,7 +126,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, "id": "bc9dfc19-e98d-4619-8856-273d97882f57", "metadata": {}, "outputs": [ @@ -132,27 +134,13 @@ "name": "stderr", "output_type": "stream", "text": [ - "Progress Bar: 22%|██▏ | 378/1729 [10:10<28:08, 1.25s/it] " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Request Error: 502\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "Progress Bar: 100%|██████████| 1729/1729 [39:41<00:00, 1.38s/it] \n" + "Progress Bar: 100%|██████████| 1734/1734 [41:48<00:00, 1.45s/it] \n" ] } ], "source": [ "# Load existing data from CSV file into a DataFrame\n", - "users_ids = pd.read_csv(f\"../../data/processed/{dir_name}/users_ids.csv\", encoding='latin1')\n", + "users_ids = pd.read_csv(f\"{base_path}/users_ids.csv\", encoding='latin1')\n", "users_ids = users_ids['user_id'].to_list()\n", "\n", "# Retrieve repository data for user IDs\n", @@ -161,13 +149,13 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "id": "7d89602d-1477-4d4a-95e4-ee2dbcedce0c", "metadata": {}, "outputs": [], "source": [ "# Save repository data to a CSV file\n", - "file_name = f\"../../data/processed/{dir_name}/repos_data.csv\"\n", + "file_name = f\"{base_path}/repos_data.csv\"\n", "users_data = pd.DataFrame(final_data)\n", "users_data.to_csv(file_name, index=False, encoding='latin1')\n", "\n", diff --git a/notebooks/01. data_collect/get_starred_data.ipynb b/notebooks/01. data_collect/get_starred_data.ipynb index 0ff7f9d..2471a02 100644 --- a/notebooks/01. data_collect/get_starred_data.ipynb +++ b/notebooks/01. data_collect/get_starred_data.ipynb @@ -56,8 +56,10 @@ "outputs": [], "source": [ "dir_name = os.getenv('DIR_NAME')\n", + "base_path = f'../../data/processed/{dir_name}'\n", + "os.makedirs(base_path, exist_ok=True)\n", "\n", - "users_ids = pd.read_csv(f\"../../data/processed/{dir_name}/users_ids.csv\", encoding='latin1')\n", + "users_ids = pd.read_csv(f\"{base_path}/users_ids.csv\", encoding='latin1')\n", "users_ids = users_ids['user_id'].to_list()" ] }, @@ -76,14 +78,14 @@ "name": "stderr", "output_type": "stream", "text": [ - "Processing: 100%|██████████| 1729/1729 [45:27<00:00, 1.58s/it] " + "Processing: 100%|██████████| 1734/1734 [43:11<00:00, 1.49s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "final_data: {'user_id': [404506, 705308, 755840, 858200, 943711, 1241552, 1554715, 1572774, 1692858, 2129497, 3595515, 3806576, 3826227, 3955395, 4475142, 4643304, 4716778, 4808798, 5019560, 5045783, 6130991, 6144022, 6535422, 6688438, 6787828, 6823987, 6915391, 6969148, 6995340, 7068535, 7589719, 7609797, 7691358, 7803333, 8029526, 8167004, 8342748, 8362985, 8768392, 8783921, 8825214, 8840165, 8881986, 8969075, 8999039, 9043223, 9259308, 9362127, 9496788, 9781670, 9819921, 10023220, 10654641, 10864249, 10880501, 10888023, 10922795, 11079693, 11230500, 11247633, 11255406, 11262620, 11368305, 11584640, 11927641, 11987675, 12021468, 12033296, 12100397, 12243288, 12692919, 12964071, 13021754, 13303659, 13402312, 13482373, 13621066, 13769987, 13836260, 13968552, 13984100, 14114666, 14326204, 14907689, 14910228, 15047907, 15192264, 15213215, 15256665, 15413104, 16305023, 16611541, 17209308, 17267747, 17307013, 17637439, 17989477, 18194047, 18216969, 18285082, 18400142, 18415360, 18603314, 18709463, 19210598, 19254270, 19359776, 19366367, 19644754, 19816874, 20244168, 20360517, 20440015, 20488304, 20513587, 20571696, 20599605, 20662186, 20702024, 20819246, 20905674, 21008078, 21173712, 21192973, 21342696, 22245869, 22305507, 22327331, 22341964, 22344536, 22374063, 22597065, 22640209, 22657992, 23185608, 23555833, 23740775, 23740856, 24277044, 24395031, 24415579, 24765887, 24766978, 24827083, 24903262, 24928542, 24961647, 25220784, 25800161, 25843851, 25931668, 26120352, 26214872, 26558566, 26708649, 26844915, 27642985, 27733133, 27965287, 28258862, 28514526, 28735704, 28783718, 28985401, 29178934, 29462510, 29792912, 29806633, 30077420, 30090160, 30523874, 30528631, 30689866, 31000619, 31217604, 31237771, 31238878, 31242188, 31246918, 31260297, 31282507, 31408474, 31477051, 31759362, 31899027, 31945644, 32058262, 32066945, 32402003, 32514855, 32597978, 32665277, 32770980, 33702490, 33831855, 33861085, 33977992, 34401880, 34800399, 34924212, 35003387, 35046818, 35900188, 36237054, 36265803, 36325257, 36434948, 36505998, 36619381, 36881559, 37243873, 37326584, 37635729, 37686832, 37707479, 37825988, 38020305, 38070519, 38094400, 38292962, 38326420, 38478347, 38946066, 39172682, 39738870, 39951469, 40000916, 40174805, 40181269, 40224762, 40237204, 40593690, 40625547, 40658328, 41486295, 41967397, 41967811, 42138007, 42249792, 42285178, 42302155, 42326571, 42444957, 42467879, 42480265, 42523503, 42549629, 42754835, 43210563, 43370602, 43747467, 43821098, 43821186, 43821712, 43958695, 43994481, 44199686, 44291462, 44292931, 44563964, 44772199, 45265091, 45293066, 45578804, 45792465, 46070272, 46302322, 46322274, 46411490, 46556049, 46570027, 46673118, 47828211, 48277037, 48757536, 48864686, 48907382, 48980408, 49094323, 49195303, 49291509, 49428431, 49757028, 49800473, 50014667, 50020723, 50044807, 50153377, 50169396, 50483524, 50568515, 50595168, 50636981, 50638164, 50657023, 50747027, 51007331, 51121224, 51226601, 51425063, 51825398, 51890460, 51932935, 51958179, 52320920, 52324498, 52411224, 52431348, 52455921, 52500235, 52585849, 52595409, 52595419, 52595445, 52691990, 52712652, 52815019, 52857132, 52931687, 52966432, 53053984, 53153255, 53174794, 53215893, 53312861, 53468037, 53570550, 53784872, 53790917, 53791616, 54008441, 54041357, 54165291, 54271761, 54271987, 54272000, 54272062, 54285917, 54623535, 54830544, 54903338, 55026292, 55235902, 55366277, 55478805, 55548276, 55550145, 55765693, 55844517, 55860970, 55871338, 56188470, 56450813, 56542586, 56685064, 56694801, 56705157, 56709665, 56931285, 56935769, 56992852, 57046729, 57064616, 57067767, 57071122, 57417802, 57498621, 57590260, 57725103, 57901563, 57982422, 57997464, 58065381, 58298580, 58364586, 58486362, 58696746, 58832119, 59121880, 59767992, 59863398, 59915519, 59961857, 60569881, 60631114, 60866090, 61278473, 61432626, 61561058, 61727729, 61735196, 62499791, 62506418, 62618676, 62674418, 62728029, 62776977, 63150230, 63426852, 63527675, 63618438, 63649156, 63803044, 63875834, 63910629, 63913528, 63976153, 64093066, 64161845, 64174170, 64279855, 64314311, 64325526, 64354399, 64354602, 64646425, 64668677, 64691992, 64875718, 65103987, 65212955, 65242826, 65508138, 65548563, 66148694, 66243493, 66390370, 66472398, 66479526, 66551006, 66783101, 67241893, 67284022, 67377749, 67378869, 67404275, 67740598, 67766388, 67790866, 67807456, 67931254, 67968674, 67983375, 68120258, 68229913, 68234552, 68255287, 68370709, 68377505, 68445853, 68459412, 68553254, 69589722, 69644296, 69655550, 69784305, 69820794, 69867337, 70128803, 70213038, 70277279, 70918025, 70985406, 71283657, 71399799, 71434398, 71510847, 71522302, 71551874, 71612009, 71687136, 71780731, 71854573, 72145382, 72154018, 72201212, 72214855, 72233494, 72309855, 72340227, 72499602, 72518473, 72521774, 72710131, 72799525, 72815169, 72819474, 72821948, 72823756, 72931424, 73386872, 73468995, 73488484, 73528747, 73537499, 73652124, 73796385, 73997145, 74591655, 74727324, 74879760, 75274423, 75278898, 75330000, 75432726, 75454542, 75501289, 75740869, 75936360, 76013172, 76060004, 76119431, 76201386, 76396858, 76516206, 76517786, 76708188, 76743863, 76938257, 77080274, 77127716, 77356995, 77571208, 77933701, 77936944, 77968389, 77975777, 78048991, 78606977, 78730979, 78818106, 78858499, 79196702, 79327825, 79366484, 79388668, 79411877, 79787418, 79858184, 79871636, 79940003, 80075551, 80112944, 80123646, 80137734, 80226121, 80396703, 80470809, 80492657, 80789474, 80850402, 81576750, 81678247, 81724288, 81755943, 81818589, 81919768, 82066066, 82148347, 82153631, 82161016, 82271481, 82442020, 82827759, 82831720, 83153592, 83244925, 83403248, 83455817, 83553159, 83719160, 83808377, 84017505, 84182866, 84225261, 84314170, 84380815, 84548982, 84616944, 85138573, 85197739, 85250817, 85518166, 85911730, 86011531, 86047797, 86053915, 86129738, 86198523, 86366723, 86381944, 86890739, 86908936, 87189308, 87477436, 87478383, 87953252, 88016026, 88153755, 88205826, 88557261, 88653524, 88678823, 88732619, 89316477, 89344441, 89345427, 89379357, 89402675, 89664210, 89780156, 89780712, 89820377, 89900029, 90114095, 90267554, 90420166, 90422313, 90465858, 90636954, 90805554, 90893587, 91061958, 91198554, 91519924, 91666537, 91953966, 92016251, 92977776, 93037649, 93071845, 93186702, 93434626, 93527357, 93798765, 93864400, 93912102, 94174654, 94529661, 94588285, 94758938, 94769696, 94811573, 95338991, 95491894, 95547177, 95558305, 95737858, 95749720, 95983990, 96057681, 96112993, 96328449, 96380575, 96472895, 97433363, 97593079, 97907993, 97970232, 98024608, 98264322, 98719122, 99065313, 99265531, 99272123, 99678047, 99757118, 100477326, 100930639, 101146092, 101388488, 102383390, 102575507, 103176239, 103209710, 103361233, 103423713, 104297128, 104763211, 105211388, 105241871, 105989003, 106206000, 106533679, 107038187, 107197809, 107857536, 107879968, 108019442, 108148355, 108238845, 108373290, 108406340, 108551667, 109064412, 109345293, 109630558, 110171878, 110357194, 111236268, 111703423, 111966243, 111978180, 112618892, 112873951, 112904406, 114033195, 116220482, 116520003, 117580376, 117710430, 119706846, 119797490, 121355275, 121378751, 121976617, 122802517, 123736124, 123747730, 124932410, 125027659, 126192030, 127418194, 128046368, 128465540, 128728895, 129966675, 130066304, 130653731, 131586974, 132569657, 132749640, 133228881, 136461003, 141511728, 143124692, 145675987, 146567901, 149876997, 150170454, 152652673, 153447751, 159538875, 165147195], 'has_moz_owner': [True, True, True, False, True, False, True, True, True, False, False, True, True, True, True, True, True, True, True, True, True, True, True, True, False, True, False, True, False, False, False, False, True, True, True, True, True, True, True, True, False, False, False, True, True, False, False, False, False, False, True, False, True, True, True, True, False, True, False, True, True, False, False, True, False, True, True, True, True, False, False, False, True, False, False, True, False, True, True, False, True, False, True, True, False, True, True, False, False, False, True, False, False, True, False, True, True, False, True, True, True, True, True, True, True, True, True, False, True, False, False, True, True, True, True, True, True, False, True, True, True, True, True, False, True, True, False, False, True, False, False, True, False, False, True, True, True, True, False, True, False, True, False, True, False, False, False, True, False, True, True, False, True, False, True, True, True, False, True, True, False, False, False, True, True, True, False, True, False, False, True, False, True, True, True, True, True, True, True, False, False, True, False, False, True, True, True, True, False, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, False, True, False, True, True, True, True, False, True, False, False, False, True, True, True, True, True, True, False, False, False, False, False, True, True, True, True, True, False, True, False, True, True, False, False, True, False, False, True, True, True, True, True, True, False, True, True, True, False, True, True, False, True, False, True, True, True, True, True, False, False, True, True, True, True, False, False, False, False, False, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, False, True, False, False, True, True, False, False, True, True, True, False, True, False, False, False, False, True, False, True, True, True, True, False, True, False, True, True, False, False, False, True, True, True, True, True, True, True, True, True, True, True, False, True, True, False, True, True, False, False, True, True, True, False, False, True, False, False, True, True, True, False, True, True, False, True, True, True, False, True, False, False, True, False, True, False, True, False, False, True, True, True, False, True, False, True, True, True, True, True, False, True, True, False, True, True, False, False, True, False, False, True, True, True, False, True, True, False, True, True, True, False, True, False, False, True, True, False, True, False, False, True, False, True, False, True, True, False, True, False, True, True, False, False, True, False, False, True, True, False, False, False, True, False, True, False, False, True, True, False, True, False, True, True, True, True, False, True, True, True, False, False, True, True, False, True, True, False, False, True, True, True, False, True, True, True, False, True, True, False, True, True, True, False, False, True, True, True, False, False, True, False, True, True, False, True, True, True, False, False, False, True, False, True, True, False, True, True, True, True, True, False, True, True, True, True, True, False, False, True, True, True, True, False, False, True, True, True, False, True, True, True, True, True, True, False, True, True, True, False, False, True, False, True, True, False, False, True, True, True, True, True, True, False, False, True, True, True, True, True, True, True, False, False, True, True, False, True, True, True, True, True, True, True, True, False, True, False, True, False, True, False, True, False, False, False, True, True, False, False, True, False, True, False, True, True, True, True, False, False, False, True, True, True, False, False, True, False, False, True, False, False, True, False, False, True, False, True, False, True, True, True, True, True, True, True, False, False, True, False, True, True, True, True, False, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, False, False, True, True, False, False, False, True, False, True, True, False, True, True, False, True, True, False, False, True, True, False, False, False, True, True, False, True, False, True, False, True, True, True, True, False, True, False, True, False, True, False, True, False, True, True, False, True, True, True, False, True, False, False, True, True, True, True, True, False, True, False, False, False, False, False, True, True, True, True, True, True, False, False, False, True, False, True, True, True, True, True, True, True, True, True, False, False, True, False, False, False, False, False, True, True, False, False, True, False], 'fav_lang': ['Ruby', 'PHP', 'PHP', None, 'Ruby', 'Python', 'JavaScript', 'Java', 'PHP', 'TypeScript', 'C', 'JavaScript', None, 'PHP', 'JavaScript', 'JavaScript', 'Java', 'Python', 'JavaScript', 'JavaScript', 'PHP', 'JavaScript', 'Java', 'Groovy', 'PHP', 'Go', None, 'JavaScript', 'TypeScript', 'HTML', 'TypeScript', 'TypeScript', None, 'JavaScript', 'Java', 'PHP', None, None, 'Python', 'JavaScript', 'Python', None, 'PHP', 'JavaScript', 'PHP', 'C++', 'HTML', 'Python', 'Python', 'Rust', None, 'JavaScript', 'R', 'PHP', 'TypeScript', 'Python', None, 'PHP', 'Makefile', 'JavaScript', 'Java', 'Swift', 'JavaScript', 'Java', 'Dart', 'JavaScript', 'Go', 'JavaScript', 'JavaScript', 'Java', 'Java', 'Java', 'JavaScript', 'Dart', 'JavaScript', 'JavaScript', None, None, 'Java', 'PHP', 'PHP', 'Shell', 'C#', None, 'HTML', 'JavaScript', 'JavaScript', 'PHP', 'TypeScript', 'Java', None, 'Python', 'TypeScript', 'JavaScript', 'PHP', None, 'Java', None, 'Java', 'C#', 'JavaScript', None, None, 'Java', 'PHP', 'TypeScript', 'Kotlin', 'JavaScript', 'Python', 'Dart', 'CSS', 'Dart', None, 'TypeScript', 'JavaScript', 'Java', 'JavaScript', None, 'Java', 'Java', 'JavaScript', 'PHP', 'JavaScript', 'Java', 'TypeScript', 'PHP', 'Swift', 'Python', 'Python', 'TypeScript', 'HTML', 'Java', 'PHP', 'Go', 'JavaScript', None, 'JavaScript', None, None, 'Python', 'PHP', 'Java', 'HTML', 'JavaScript', 'TypeScript', 'Java', 'C#', None, None, None, 'PHP', 'C++', 'JavaScript', 'TypeScript', 'C#', 'JavaScript', 'Python', 'JavaScript', 'TypeScript', 'JavaScript', 'Python', 'PHP', 'Jupyter Notebook', 'Kotlin', None, 'JavaScript', 'Java', 'JavaScript', 'TypeScript', 'HTML', 'Java', 'JavaScript', None, 'JavaScript', 'Blade', 'JavaScript', 'JavaScript', None, 'JavaScript', 'JavaScript', 'HTML', None, 'Python', 'Python', 'PHP', 'PHP', 'Java', 'Kotlin', 'C#', 'PHP', 'JavaScript', 'Java', 'HTML', None, None, 'JavaScript', 'Python', None, None, 'TypeScript', 'Java', 'JavaScript', 'HTML', 'TypeScript', 'PHP', 'HTML', 'Java', 'Java', 'PHP', 'TypeScript', 'Dart', None, 'Go', 'Java', None, 'JavaScript', 'Kotlin', 'HTML', 'Java', 'HTML', 'Java', 'Dart', 'JavaScript', None, 'TypeScript', 'Java', 'JavaScript', 'Python', 'Java', 'JavaScript', 'JavaScript', 'C', 'JavaScript', 'Dart', 'Python', None, 'JavaScript', 'Vue', 'PHP', 'HTML', 'HTML', None, 'JavaScript', 'Java', 'PHP', 'Java', 'C#', 'PHP', 'Jupyter Notebook', 'Dart', 'JavaScript', 'Dart', 'Go', 'Java', 'Python', 'PHP', 'Dart', 'TypeScript', 'JavaScript', 'Kotlin', 'JavaScript', 'HTML', 'JavaScript', 'QML', 'PHP', 'PHP', None, 'HTML', 'HTML', 'C++', 'C#', 'HTML', 'Java', 'C#', None, None, 'Dart', 'JavaScript', 'TypeScript', 'TypeScript', 'Dart', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', None, 'Java', 'Java', 'Java', 'Java', 'JavaScript', 'TypeScript', 'HTML', 'Python', 'Dart', None, 'JavaScript', 'Java', 'Kotlin', 'CSS', 'Python', 'Java', 'Dart', 'JavaScript', 'TypeScript', 'TypeScript', 'HTML', 'Makefile', 'HTML', 'Astro', None, 'CSS', None, None, None, 'Dart', 'PHP', None, 'JavaScript', 'Vue', 'JavaScript', 'TypeScript', 'PHP', 'JavaScript', 'JavaScript', 'JavaScript', 'Java', 'TypeScript', 'HTML', 'Java', 'TypeScript', 'PHP', 'Kotlin', 'JavaScript', 'JavaScript', 'C++', 'TypeScript', None, 'Dart', 'PHP', 'Dart', None, 'C++', 'PHP', None, None, 'PHP', 'PHP', None, 'Dart', 'JavaScript', 'JavaScript', 'Dart', 'Java', 'PHP', 'JavaScript', 'Python', 'Java', 'HTML', 'Java', 'HTML', 'Java', None, 'JavaScript', 'Java', 'PHP', 'TypeScript', 'Python', 'JavaScript', 'JavaScript', None, 'C#', 'TypeScript', None, 'Python', 'Python', 'Go', 'TypeScript', 'Java', 'Java', 'JavaScript', 'Dart', None, 'CSS', 'JavaScript', None, None, 'CSS', None, 'Jupyter Notebook', None, 'HTML', 'Python', 'Python', 'Python', None, 'TypeScript', 'Dart', 'TypeScript', 'Go', None, None, 'HTML', None, 'Jupyter Notebook', None, 'JavaScript', 'Python', 'CSS', 'TypeScript', 'JavaScript', 'JavaScript', 'Java', 'Go', 'C++', 'PHP', None, None, 'JavaScript', 'JavaScript', 'Go', 'TypeScript', 'PHP', 'JavaScript', None, 'Python', 'Shell', 'HTML', 'TypeScript', 'TypeScript', None, 'JavaScript', 'PHP', None, 'SCSS', 'HTML', 'CSS', 'HTML', 'C#', None, 'Shell', 'JavaScript', None, 'Java', 'Python', 'PHP', 'TypeScript', None, 'Jupyter Notebook', None, 'Java', 'HTML', 'TypeScript', None, 'Java', 'CSS', 'Dart', 'JavaScript', None, 'Java', 'JavaScript', 'Python', 'HTML', 'HTML', 'Python', 'C++', 'TypeScript', 'TypeScript', 'HTML', 'Python', 'Java', None, None, 'HTML', None, 'JavaScript', 'C#', 'JavaScript', 'JavaScript', None, 'Shell', 'Vue', 'PHP', 'Python', 'HTML', 'JavaScript', 'Zig', 'HTML', 'JavaScript', 'JavaScript', None, 'Java', 'JavaScript', 'JavaScript', 'Ruby', 'Jupyter Notebook', 'JavaScript', None, 'Dart', None, 'Python', 'JavaScript', None, 'TypeScript', 'PHP', 'C', 'PHP', 'JavaScript', 'Dart', 'TypeScript', 'Java', 'Dart', 'JavaScript', 'JavaScript', None, 'TypeScript', 'HTML', 'JavaScript', 'TypeScript', 'Java', None, None, 'JavaScript', None, 'CSS', None, 'JavaScript', 'PHP', None, 'Python', 'HTML', 'CSS', 'TypeScript', 'Python', 'PHP', 'CSS', None, 'TypeScript', None, 'Python', 'JavaScript', 'PHP', 'C++', 'HTML', 'HTML', 'Java', 'Python', 'JavaScript', 'Go', 'TypeScript', None, 'CSS', 'JavaScript', None, 'JavaScript', 'JavaScript', 'JavaScript', 'Java', None, 'Blade', 'Java', 'JavaScript', 'JavaScript', 'Python', 'JavaScript', 'JavaScript', 'Java', 'TypeScript', 'Dart', 'Jupyter Notebook', None, None, 'HTML', None, 'CSS', 'HTML', 'Solidity', 'Java', 'JavaScript', 'PHP', 'Java', 'Dart', None, 'Java', 'Dockerfile', 'C', 'Python', 'JavaScript', 'JavaScript', None, 'PHP', None, 'JavaScript', 'HTML', 'Java', 'Java', 'HTML', 'JavaScript', 'Java', None, 'C', None, 'Java', None, 'JavaScript', None, 'Jupyter Notebook', 'PHP', 'Java', None, 'Java', 'PHP', 'HTML', 'Java', 'Java', 'HTML', 'HTML', 'Java', None, 'Java', None, 'Java', 'JavaScript', 'PHP', None, None, None, None, 'JavaScript', 'PHP', 'Java', None, 'Jupyter Notebook', None, 'Python', 'HTML', 'JavaScript', 'Swift', 'Java', None, None, None, 'TypeScript', None, 'JavaScript', None, 'Python', 'Dart', 'PHP', 'JavaScript', None, 'JavaScript', 'JavaScript', 'HTML', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', 'Svelte', 'Java', 'Java', None, 'JavaScript', 'JavaScript', 'Java', 'Java', None, 'JavaScript', 'TypeScript', 'JavaScript', 'JavaScript', 'C', None, 'Java', 'PHP', 'Kotlin', 'CSS', 'Java', 'TypeScript', 'TypeScript', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', 'Jupyter Notebook', 'HTML', 'Python', None, 'JavaScript', None, None, None, 'CSS', 'Dart', 'JavaScript', None, 'Java', 'TypeScript', 'TypeScript', 'JavaScript', 'HTML', None, 'HTML', None, 'HTML', None, 'Jupyter Notebook', 'Java', None, 'Python', 'Java', None, 'HTML', None, 'HTML', 'Java', 'Shell', 'JavaScript', 'HTML', 'JavaScript', 'Python', 'CSS', 'Python', 'HTML', 'TypeScript', 'HTML', 'CSS', 'Java', 'JavaScript', 'JavaScript', 'HTML', 'TypeScript', 'Java', 'HTML', 'EJS', 'JavaScript', 'PHP', 'Python', None, 'CSS', 'Python', 'HTML', 'HTML', None], 'fav_topic': ['accordion', 'php', 'php', 'git', None, None, 'machine-learning', None, 'php', 'typescript', 'css', 'javascript', 'cms', 'alibaba', 'react', 'api', None, 'python', 'javascript', 'android', 'php', 'machine-learning', None, 'demographics', 'application-wrapper', 'kubernetes', 'careers', 'api', 'react-native', 'careers', 'vue', 'careers', 'dart', 'browser', 'synced-settings', 'php', 'java', None, None, 'javascript', 'esmf', 'javascript', 'docker', 'mpesa', 'php', 'command-line', 'accordion', 'css', 'hacktoberfest', None, 'compiler', 'bypass', 'r', 'laravel', 'typescript', 'bpmn', 'hacking', 'api', 'climate', 'javascript', 'android', 'swift', 'css', 'java', 'flutter', 'javascript', 'hacktoberfest', 'css-questions', 'javascript', 'android', None, 'java', 'hacktoberfest', 'android', 'mozambique', 'android', 'awesome-list', 'hacktoberfest', 'android', 'laravel', 'python', 'docker', 'dotnet', None, None, 'bootstrap', None, None, 'ai-art', 'uber-clone', 'javascript', 'cisco', 'careers', 'education', 'framework', 'javascript', 'gamification', None, 'hacktoberfest', 'hacktoberfest', 'javascript', 'javascript', 'hacktoberfest', 'java', 'api', 'golang', 'android', 'react', 'php', 'android', 'animation', 'e-commerce', 'javascript', 'laravel', 'vue', 'java', 'javascript', 'google-cloud', 'java', None, 'laravel', 'wordpress', 'dicebear', 'framework', 'typescript', 'laravel', None, 'awesome-list', 'python', 'careers', 'apps', None, 'angular', 'go', 'vue', 'cordova', 'javascript', 'hacktoberfest', 'dataset', 'python', None, None, 'data-science', 'nextjs', 'careers', 'careers', 'create', None, 'books', 'hacktoberfest', 'data-science', 'careers', 'react', 'careers', 'asp-net-core', 'javascript', 'python', 'javascript', 'hacktoberfest', None, 'python', 'laravel', 'javascript', 'kotlin', None, None, None, 'next14', None, None, 'css3', 'atom', 'bootstrap', None, 'composer', 'application-realtime', 'python', 'software-testing', 'javascript', 'hacktoberfest', 'boostrap', 'blog-engine', 'machine-learning', None, None, 'laravel', 'android', 'android', None, 'mpesa', None, None, 'django', 'hacktoberfest', 'best-of', 'javascript', 'python', None, 'config', 'hacktoberfest', 'android', 'blockchain', None, 'hacktoberfest', 'activator', 'css', None, 'android', 'mpesa', 'css', 'flutter', 'animation', 'javascript', 'hacktoberfest', 'awesome', None, 'android', 'gratuito', None, 'bootstrap', None, 'aplicativo', 'hacktoberfest', 'tutorials', None, None, 'hacktoberfest', 'discord', 'java', 'hacktoberfest', 'javascript', 'bios', 'css', 'dart', 'angular', 'msisdn-validate', 'laravel', 'vue', None, 'bootstrap', 'material', 'api', 'javascript', 'java', 'api', None, None, 'vue', 'bootstrap4', 'flutter', 'nodejs', 'kotlin', 'cli', 'javascript', 'django', 'laravel', None, 'windows', 'react', 'android', 'react', None, 'express', 'react', None, 'cyber-security', None, 'lists', '100daysofcode', 'nodejs', 'c-sharp', 'calculator', None, 'c-sharp', 'nlw-06', 'react', 'flutter', 'android', 'expo', 'javascript', 'flutter', 'algorithm', 'formatter', 'hacktoberfest', None, 'design-system', None, None, None, None, 'css', 'drag-and-drop', 'api', 'applications', 'awesome-list', 'github', 'javascript', None, 'javascript', 'educational', 'blue-team', None, 'flutter', 'android', 'nodejs', 'docker', 'html', 'busybox', 'data-science', 'admin', 'security', 'css', None, None, None, 'flutter', 'laravel', 'data-analysis', 'react', None, 'authentication', 'framework', 'database', 'fullpage', 'react', 'vue', 'adminlte3', 'docker', None, 'android', 'golang-package', 'javascript', 'kotlin', 'synced-settings', None, None, 'vim', 'config', None, 'php', 'dart', 'css', 'cheat-fortnite-', 'challenge', 'hacktoberfest', None, 'php', 'imersao-java', 'awesome', 'flutter', 'hacktoberfest', 'hacktoberfest', 'desktop', None, None, 'python', 'github', 'java', 'codeinthedark', 'opengl', 'blockchain', 'spring-boot', 'mpesa', 'aws', 'java', 'laravel', 'backend', 'machine-learning', 'css', 'react', None, 'blazor', 'javascript', 'betty', 'deep-learning', 'awesome', 'fga', 'components', 'hacktoberfest', 'java', 'mozambique', 'flutter', 'github', None, 'android', None, None, 'css3', 'javascript', None, 'war-thunder-aimbot', None, None, 'aix', 'security', 'openai-api', 'nodejs', None, 'typescript', 'awesome-react-stuff', None, 'hacktoberfest', 'javascript', None, 'datascience', 'hacktoberfest', None, 'django', 'framework', 'security', None, 'codeinthedark', None, '2d', 'c', None, None, 'best-practices', None, 'react', 'go', 'e2payments', 'laravel', 'react', 'javascript', 'html', 'macos', None, 'components', 'typescript', 'javascript', 'hacktoberfest', 'laravel', 'applications', 'css', None, None, 'adminlte', 'create', 'admin', 'linux', 'react', 'guidelines', 'java', None, None, 'mpesa', 'exploitation', None, 'git', None, None, 'bash', 'books', None, 'advent-of-code', None, 'clean-architecture', 'awesome-list', None, None, None, 'config', None, 'algorithm-visualisation', 'cpp', None, 'javascript', None, 'curso-em-video', 'hacktoberfest', 'css', 'ruby', None, 'git', None, 'book', 'expo', 'react', 'calculations', None, 'vuejs', None, None, 'coding-in-community', 'hacktoberfest', 'bun', 'curso', 'react', 'react', 'android', None, 'animated', 'canvas', None, 'binary', 'react-native', 'javascript', 'api', 'hacktoberfest', 'deep-learning', 'typescript', 'config', None, None, None, 'face-detection', 'machine-learning', 'hacktoberfest', 'd3js', 'annotations', 'android', 'books', 'javascript', 'api', 'react', None, 'ai-images', 'education', 'boostrap', 'hacktoberfest', None, 'javascript', 'api', None, None, 'awesome-list', 'php', 'awesome', 'django', 'react', 'brands', 'gis', 'css3', 'laravel', None, 'cheat-sheet', 'typescript', 'algorithm', None, 'java', 'php', None, 'javascript', None, None, 'api', 'portfolio-site', 'hacktoberfest', None, 'community', 'react', None, 'javascript', 'java', 'begginers', None, None, 'config', 'advance-ecommerce-project', 'collaborate', 'php', 'config', 'hacktoberfest', 'javascript', 'react', 'collaborate', 'android', 'flutter', 'python', 'github', 'hacktoberfest', 'curso', None, None, 'capture', 'git', None, 'coming-soon-page', None, None, 'flutter', 'aws', None, None, None, 'awesome', 'python', 'typescript', 'nextjs', 'config', 'awesome-list', None, 'css3', None, None, 'bootstrap4', None, 'java', 'javascript', 'editor', 'config', None, 'hacktoberfest', 'best-practices', 'javascript', 'cartography', 'excel', 'android', None, 'java17', 'attachment', None, 'crud', None, 'bootstrap5', 'portfolio', 'android', None, None, 'tutorial', None, 'recognition', None, 'bash-configuration', None, None, 'appsec', 'javascript', 'desktop', None, 'config', 'data-science', None, 'amazon', None, 'javascript', 'ios', None, 'javascript', 'animations', 'hacktoberfest', 'typescript', 'intern', 'typescript', 'awesome', 'github-config', None, 'deploy', 'javascript', 'game-development', 'javascript', 'aws-ses', 'javascript', 'artificial-intelligence', 'hacktoberfest', None, 'beginner-project', 'component', None, 'hacktoberfest', None, 'component', 'javascript', 'brasil', None, 'hacktoberfest', 'adhan', 'mozambique', 'css', None, 'github', None, 'projetos-em-java', None, 'declarative', None, 'java', 'react', None, 'game', 'cheat-sheet', None, 'dio', 'design-system', 'maintenance-page', 'javascript', 'brute-force', None, None, 'css3', None, None, 'dart', 'awesome-list', None, 'hacktoberfest', 'chat', 'agnus', 'hacktoberfest', 'gustavoguanabara', None, None, 'awesome-list', None, None, 'ai', None, 'angular-roadmap', None, 'java', None, 'e2payments', 'algorithms', 'rocketseat', 'reactjs', 'linux', 'sms', 'curso', 'mozambique', 'github', None, None, None, 'android', None, 'html-css', None, 'books', None, None, None, None, 'curso', None, None, None, 'javascript', 'config', 'config', 'django', 'curso', None, 'curso']}\n" + "final_data: {'user_id': [404506, 705308, 755840, 858200, 943711, 1241552, 1554715, 1572774, 1692858, 2129497, 2580338, 3595515, 3806576, 3826227, 3955395, 4475142, 4643304, 4716778, 4808798, 5019560, 5045783, 6130991, 6144022, 6535422, 6688438, 6787828, 6823987, 6915391, 6969148, 6995340, 7068535, 7589719, 7609797, 7691358, 7803333, 8029526, 8167004, 8342748, 8362985, 8768392, 8783921, 8825214, 8840165, 8881986, 8969075, 8999039, 9043223, 9259308, 9362127, 9496788, 9781670, 9819921, 10023220, 10654641, 10864249, 10880501, 10888023, 10922795, 11079693, 11230500, 11247633, 11255406, 11262620, 11368305, 11584640, 11927641, 11987675, 12021468, 12033296, 12100397, 12243288, 12692919, 12964071, 13021754, 13303659, 13402312, 13482373, 13621066, 13769987, 13836260, 13968552, 13984100, 14114666, 14326204, 14907689, 14910228, 15047907, 15192264, 15202121, 15206337, 15213215, 15256665, 15413104, 16305023, 16611541, 17209308, 17267747, 17307013, 17637439, 17989477, 18194047, 18216969, 18285082, 18400142, 18415360, 18603314, 18709463, 19210598, 19254270, 19359776, 19366367, 19644754, 19816874, 20244168, 20360517, 20440015, 20488304, 20513587, 20571696, 20599605, 20662186, 20702024, 20819246, 20905674, 21008078, 21173712, 21192973, 21342696, 22245869, 22305507, 22327331, 22341964, 22344536, 22374063, 22524099, 22597065, 22640209, 22657992, 23185608, 23555833, 23740775, 23740856, 24277044, 24395031, 24415579, 24765887, 24766978, 24827083, 24903262, 24928542, 24961647, 25220784, 25800161, 25843851, 25931668, 26120352, 26214872, 26558566, 26708649, 26844915, 27642985, 27733133, 27965287, 28258862, 28514526, 28735704, 28783718, 28985401, 29178934, 29462510, 29792912, 29806633, 30077420, 30090160, 30523874, 30528631, 30689866, 31000619, 31217604, 31237771, 31238878, 31242188, 31246918, 31260297, 31282507, 31408474, 31477051, 31759362, 31899027, 31945644, 32058262, 32066945, 32402003, 32514855, 32597978, 32665277, 32770980, 33702490, 33831855, 33861085, 33977992, 34401880, 34800399, 34924212, 35003387, 35046818, 35900188, 36237054, 36265803, 36325257, 36434948, 36505998, 36619381, 36881559, 37243873, 37326584, 37635729, 37686832, 37707479, 37825988, 38020305, 38070519, 38094400, 38292962, 38326420, 38478347, 38946066, 39172682, 39738870, 39951469, 40000916, 40174805, 40181269, 40224762, 40237204, 40593690, 40625547, 40658328, 41486295, 41967397, 41967811, 42138007, 42249792, 42285178, 42302155, 42326571, 42444957, 42467879, 42480265, 42523503, 42549629, 42754835, 43210563, 43370602, 43747467, 43821098, 43821186, 43821712, 43958695, 43994481, 44199686, 44291462, 44292931, 44563964, 44772199, 45265091, 45293066, 45578804, 45792465, 46070272, 46302322, 46322274, 46411490, 46556049, 46570027, 46673118, 47828211, 48277037, 48757536, 48864686, 48907382, 48980408, 49094323, 49195303, 49291509, 49428431, 49757028, 49800473, 50014667, 50020723, 50044807, 50153377, 50169396, 50483524, 50568515, 50595168, 50636981, 50638164, 50657023, 50747027, 51007331, 51121224, 51226601, 51425063, 51825398, 51890460, 51932935, 51958179, 52320920, 52324498, 52411224, 52431348, 52455921, 52500235, 52585849, 52595409, 52595419, 52595445, 52691990, 52712652, 52815019, 52857132, 52931687, 52966432, 53053984, 53153255, 53174794, 53215893, 53312861, 53468037, 53570550, 53784872, 53790917, 53791616, 54008441, 54041357, 54165291, 54271761, 54271987, 54272000, 54272062, 54285917, 54623535, 54830544, 54903338, 55026292, 55235902, 55366277, 55478805, 55548276, 55550145, 55765693, 55844517, 55860970, 55871338, 56188470, 56450813, 56542586, 56685064, 56694801, 56705157, 56709665, 56931285, 56935769, 56992852, 57046729, 57064616, 57067767, 57071122, 57417802, 57498621, 57590260, 57725103, 57901563, 57982422, 57997464, 58065381, 58298580, 58364586, 58486362, 58696746, 58832119, 59062594, 59121880, 59767992, 59863398, 59915519, 59961857, 60569881, 60631114, 60866090, 61278473, 61432626, 61561058, 61727729, 61735196, 62499791, 62506418, 62618676, 62674418, 62728029, 62776977, 63150230, 63426852, 63527675, 63618438, 63649156, 63803044, 63875834, 63910629, 63913528, 63976153, 64093066, 64161845, 64174170, 64279855, 64314311, 64325526, 64354399, 64354602, 64646425, 64668677, 64691992, 64875718, 65103987, 65212955, 65242826, 65508138, 65548563, 66148694, 66243493, 66390370, 66472398, 66479526, 66551006, 66783101, 67241893, 67284022, 67377749, 67378869, 67404275, 67740598, 67766388, 67790866, 67807456, 67931254, 67968674, 67983375, 68120258, 68229913, 68234552, 68255287, 68370709, 68377505, 68445853, 68459412, 68553254, 69146181, 69589722, 69644296, 69655550, 69784305, 69820794, 69867337, 70128803, 70213038, 70277279, 70918025, 70985406, 71283657, 71399799, 71434398, 71510847, 71522302, 71551874, 71612009, 71687136, 71780731, 71854573, 72145382, 72154018, 72201212, 72214855, 72233494, 72309855, 72340227, 72499602, 72518473, 72521774, 72710131, 72799525, 72815169, 72819474, 72821948, 72823756, 72931424, 73386872, 73468995, 73488484, 73528747, 73537499, 73652124, 73796385, 73997145, 74556942, 74591655, 74727324, 74879760, 75274423, 75278898, 75330000, 75432726, 75454542, 75501289, 75740869, 75936360, 76013172, 76060004, 76119431, 76201386, 76396858, 76516206, 76517786, 76708188, 76743863, 76938257, 77080274, 77127716, 77356995, 77571208, 77933701, 77936944, 77968389, 77975777, 78048991, 78606977, 78730979, 78818106, 78858499, 79196702, 79327825, 79366484, 79388668, 79411877, 79787418, 79858184, 79871636, 79940003, 80075551, 80112944, 80123646, 80137734, 80226121, 80396703, 80470809, 80492657, 80789474, 80850402, 81576750, 81678247, 81724288, 81755943, 81818589, 81919768, 82066066, 82148347, 82153631, 82161016, 82271481, 82442020, 82827759, 82831720, 83153592, 83244925, 83403248, 83455817, 83553159, 83719160, 83808377, 84017505, 84182866, 84225261, 84314170, 84380815, 84548982, 84616944, 85138573, 85197739, 85250817, 85518166, 85911730, 86011531, 86047797, 86053915, 86129738, 86198523, 86366723, 86381944, 86890739, 86908936, 87189308, 87477436, 87478383, 87953252, 88016026, 88153755, 88205826, 88557261, 88678823, 88732619, 89316477, 89321911, 89344441, 89345427, 89379357, 89402675, 89664210, 89780156, 89780712, 89820377, 89900029, 90114095, 90267554, 90420166, 90422313, 90465858, 90636954, 90805554, 90893587, 91061958, 91198554, 91519924, 91666537, 91953966, 92016251, 92977776, 93037649, 93071845, 93186702, 93434626, 93527357, 93798765, 93864400, 93912102, 94174654, 94529661, 94588285, 94758938, 94769696, 94811573, 95338991, 95491894, 95547177, 95737858, 95749720, 95983990, 96057681, 96112993, 96328449, 96380575, 96472895, 97433363, 97593079, 97907993, 97970232, 98024608, 98264322, 98719122, 99065313, 99265531, 99272123, 99678047, 99757118, 100477326, 100930639, 101146092, 101388488, 102383390, 102575507, 103176239, 103209710, 103361233, 103423713, 104297128, 104763211, 105211388, 105241871, 105989003, 106206000, 106533679, 107038187, 107197809, 107857536, 107879968, 108019442, 108148355, 108238845, 108373290, 108551667, 109064412, 109345293, 109630558, 110171878, 110357194, 111236268, 111703423, 111966243, 111978180, 112618892, 112873951, 112904406, 114033195, 116220482, 116520003, 117580376, 117710430, 119706846, 119797490, 121355275, 121378751, 121976617, 122802517, 122971587, 123736124, 123747730, 124932410, 125027659, 126192030, 127418194, 128046368, 128465540, 128728895, 129966675, 130066304, 130653731, 131586974, 132569657, 132749640, 133228881, 134437448, 136461003, 141511728, 143124692, 145675987, 146567901, 149876997, 150170454, 152652673, 153447751, 159538875, 165147195], 'has_moz_owner': [True, True, True, False, True, False, True, True, True, False, False, False, True, True, True, True, True, True, True, True, True, True, True, True, True, False, True, False, True, False, False, False, False, True, True, True, True, True, True, True, True, False, False, False, True, True, False, False, False, False, False, True, False, True, True, True, True, False, True, False, True, True, False, False, True, False, True, True, True, True, False, False, False, True, False, False, True, False, True, True, False, True, False, True, True, False, True, True, False, False, False, False, False, True, False, False, True, False, True, True, False, True, True, True, True, True, True, True, True, True, False, True, False, False, True, True, True, True, True, True, False, True, True, True, True, True, False, True, True, False, False, True, False, False, True, True, False, False, True, True, True, True, False, True, False, True, False, True, False, False, False, True, False, True, True, False, True, False, True, True, True, False, True, True, False, False, False, True, True, True, False, True, False, False, True, False, True, True, True, True, True, True, True, False, False, True, False, False, True, True, True, True, False, True, True, True, False, True, True, True, True, True, True, True, True, True, False, True, False, True, False, True, True, True, True, False, True, False, False, False, True, True, True, True, True, True, False, False, False, False, False, True, True, True, True, True, False, True, False, True, True, False, False, True, False, False, True, True, True, True, True, True, True, True, True, True, False, True, True, False, True, False, True, True, True, True, True, False, False, True, True, True, True, False, False, False, False, False, True, True, True, True, True, True, True, True, True, True, False, True, True, True, True, True, True, False, True, False, True, False, False, True, True, False, False, True, True, True, False, True, False, False, False, False, True, False, True, True, True, True, False, True, False, True, True, False, False, False, True, True, True, True, True, True, True, True, True, True, True, False, True, True, False, True, True, False, False, True, True, True, False, False, True, False, False, True, True, True, False, True, True, False, True, True, True, False, True, False, False, True, True, True, False, True, False, False, True, True, True, False, True, False, True, True, True, True, True, True, False, True, True, False, True, True, False, False, True, False, False, True, True, True, False, True, True, False, True, True, True, False, True, False, False, True, True, False, True, False, False, True, False, True, False, True, True, False, True, False, True, True, False, False, True, False, False, True, True, False, False, False, True, False, True, False, False, True, True, False, True, False, True, True, True, True, False, True, True, False, True, False, False, True, True, False, True, True, False, False, True, True, True, False, True, True, True, False, True, True, False, True, True, True, False, False, True, True, True, False, False, True, False, True, True, False, True, True, True, False, False, False, True, False, True, True, True, False, True, True, True, True, True, False, True, True, True, True, True, False, False, True, True, True, True, False, False, True, True, True, False, True, True, True, True, True, True, False, True, True, True, False, False, True, False, True, True, False, False, True, True, True, True, True, True, False, False, True, True, True, True, True, True, True, False, False, True, True, False, True, True, True, True, True, True, True, True, False, True, False, True, False, True, False, True, False, False, False, True, True, False, False, True, False, True, False, True, True, True, True, False, False, False, True, True, True, False, False, True, False, True, False, False, False, True, False, False, True, False, True, False, True, True, True, True, True, True, True, False, False, True, False, True, True, True, True, False, True, True, False, True, True, True, True, True, True, True, True, True, True, True, True, False, False, False, True, False, False, False, True, False, True, True, False, True, True, False, True, True, False, False, True, True, False, False, False, True, True, False, True, False, True, False, True, True, True, True, False, True, False, True, False, True, False, True, False, True, True, False, True, True, False, True, False, False, True, True, True, True, True, False, True, False, False, False, False, False, True, True, True, True, True, True, False, False, False, False, True, False, True, True, True, True, True, True, True, True, True, False, False, True, True, False, False, False, False, False, True, True, False, False, True, False], 'fav_lang': ['Ruby', 'PHP', 'PHP', 'TypeScript', 'Ruby', 'Python', 'JavaScript', 'Java', 'PHP', 'TypeScript', 'Python', 'C', 'JavaScript', None, 'PHP', 'JavaScript', 'JavaScript', 'Java', 'Python', 'JavaScript', 'JavaScript', 'PHP', 'JavaScript', 'Java', 'Groovy', 'PHP', 'Go', None, 'JavaScript', 'TypeScript', 'HTML', 'TypeScript', 'TypeScript', None, 'JavaScript', 'Java', 'PHP', None, None, 'Python', 'JavaScript', 'Python', None, 'TypeScript', 'JavaScript', 'PHP', 'C++', 'HTML', 'Python', 'Python', 'Rust', None, 'JavaScript', 'R', 'PHP', 'TypeScript', 'Python', None, 'PHP', 'Makefile', 'JavaScript', 'Java', 'Swift', 'JavaScript', 'Java', 'Dart', 'JavaScript', 'Go', 'JavaScript', 'JavaScript', 'Java', 'Java', 'Java', 'JavaScript', 'Dart', 'JavaScript', 'JavaScript', None, None, 'Java', 'PHP', 'PHP', 'Shell', 'C#', None, 'HTML', 'JavaScript', 'JavaScript', 'Java', 'Python', 'PHP', 'TypeScript', 'Java', None, 'Python', 'TypeScript', 'JavaScript', 'PHP', None, 'Java', None, 'Java', 'C#', 'JavaScript', None, None, 'Java', 'PHP', 'TypeScript', 'Kotlin', 'JavaScript', 'Python', 'Dart', 'CSS', 'Dart', None, 'TypeScript', 'TypeScript', 'Java', 'JavaScript', None, 'Java', 'Java', 'JavaScript', 'PHP', 'JavaScript', 'Java', 'TypeScript', 'PHP', 'Swift', 'Python', 'Python', 'TypeScript', 'HTML', 'HTML', 'Java', 'PHP', 'Go', 'JavaScript', None, 'JavaScript', None, None, 'Python', 'PHP', 'Java', 'JavaScript', 'JavaScript', 'TypeScript', 'Java', 'C#', None, None, None, 'PHP', 'C++', 'JavaScript', 'TypeScript', 'C#', 'JavaScript', 'Python', 'JavaScript', 'TypeScript', 'JavaScript', 'Python', 'PHP', 'Jupyter Notebook', 'Kotlin', None, 'JavaScript', 'Java', 'JavaScript', 'TypeScript', 'HTML', 'Java', 'JavaScript', None, 'JavaScript', 'Blade', 'JavaScript', 'JavaScript', None, 'JavaScript', 'JavaScript', 'HTML', None, 'Python', 'Python', 'PHP', 'PHP', 'Java', 'Kotlin', 'C#', 'PHP', 'JavaScript', 'Java', 'HTML', None, None, 'JavaScript', 'Python', None, None, 'TypeScript', 'Java', 'JavaScript', 'HTML', 'TypeScript', 'PHP', 'HTML', 'Java', 'Java', 'PHP', 'TypeScript', 'Dart', None, 'Go', 'Java', None, 'JavaScript', 'Kotlin', 'HTML', 'Java', 'HTML', 'Java', 'Dart', 'JavaScript', None, 'TypeScript', 'Java', 'JavaScript', 'Python', 'Java', 'JavaScript', 'JavaScript', 'C', 'JavaScript', 'Dart', 'Python', None, 'JavaScript', 'Vue', 'PHP', 'HTML', 'HTML', None, 'JavaScript', 'Java', 'PHP', 'Java', 'C#', 'PHP', 'HTML', 'Dart', 'JavaScript', 'Dart', 'Go', 'Java', 'Python', 'PHP', 'Dart', 'TypeScript', 'JavaScript', 'Kotlin', 'JavaScript', 'HTML', 'JavaScript', 'QML', 'PHP', 'PHP', None, 'HTML', 'HTML', 'C++', 'C#', 'HTML', 'Java', 'C#', None, None, 'Dart', 'JavaScript', 'TypeScript', 'TypeScript', 'Dart', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', None, 'Java', 'Java', 'Java', 'Java', 'JavaScript', 'TypeScript', 'HTML', 'Python', 'Dart', None, 'JavaScript', 'Java', 'Kotlin', 'CSS', 'Python', 'Java', 'Dart', 'JavaScript', 'TypeScript', 'TypeScript', 'HTML', 'Makefile', 'HTML', 'Astro', None, 'CSS', None, None, None, 'Dart', 'PHP', None, 'JavaScript', 'Vue', 'JavaScript', 'TypeScript', 'PHP', 'JavaScript', 'JavaScript', 'JavaScript', 'Java', 'TypeScript', 'HTML', 'Java', 'TypeScript', 'PHP', 'Kotlin', 'JavaScript', 'JavaScript', 'C++', 'TypeScript', None, 'Dart', 'PHP', 'Dart', None, 'C++', 'PHP', None, None, 'PHP', 'PHP', None, 'Dart', 'JavaScript', 'JavaScript', 'Dart', 'Java', 'PHP', 'JavaScript', 'Python', 'Java', 'HTML', 'Java', 'HTML', 'Java', None, 'JavaScript', 'Java', 'PHP', 'Go', 'Python', 'JavaScript', 'JavaScript', None, 'C#', 'TypeScript', None, 'Python', 'Python', 'Go', 'TypeScript', None, 'Java', 'Java', 'JavaScript', 'Dart', 'JavaScript', 'CSS', 'JavaScript', None, None, 'CSS', None, 'R', None, 'HTML', 'Python', 'Python', 'Python', None, 'TypeScript', 'Dart', 'TypeScript', 'Go', None, None, 'HTML', None, 'Jupyter Notebook', None, 'JavaScript', 'Python', 'CSS', 'TypeScript', 'JavaScript', 'JavaScript', 'Java', 'Go', 'C++', 'PHP', None, None, 'JavaScript', 'JavaScript', 'Go', 'TypeScript', 'PHP', 'JavaScript', None, 'Python', 'Shell', 'HTML', 'TypeScript', 'TypeScript', None, 'JavaScript', 'PHP', None, 'SCSS', 'HTML', 'CSS', 'HTML', 'C#', None, 'Shell', 'JavaScript', None, 'Java', 'Python', 'PHP', 'TypeScript', None, 'Jupyter Notebook', None, 'Java', 'HTML', 'Java', 'TypeScript', None, 'Java', 'CSS', 'Dart', 'JavaScript', 'JavaScript', 'Java', 'JavaScript', 'Python', 'HTML', 'HTML', 'Python', 'C++', 'TypeScript', 'TypeScript', 'HTML', 'Python', 'Java', None, None, 'HTML', None, 'JavaScript', 'C#', 'JavaScript', 'JavaScript', None, 'Shell', 'Vue', 'PHP', 'Python', 'HTML', 'JavaScript', 'TypeScript', 'HTML', 'JavaScript', 'JavaScript', None, 'Java', 'JavaScript', 'JavaScript', 'Ruby', 'Jupyter Notebook', 'JavaScript', None, 'Python', 'Dart', None, 'Python', 'JavaScript', None, 'TypeScript', 'PHP', 'C', 'PHP', 'JavaScript', 'Dart', 'TypeScript', 'Java', 'Dart', 'JavaScript', 'JavaScript', 'Java', 'TypeScript', 'HTML', 'JavaScript', 'TypeScript', 'Java', None, None, 'JavaScript', None, 'CSS', None, 'JavaScript', 'PHP', None, 'Python', 'HTML', 'CSS', 'TypeScript', 'Python', 'PHP', 'CSS', None, 'TypeScript', None, 'Python', 'JavaScript', 'PHP', 'C++', 'HTML', 'HTML', 'Java', 'Python', 'JavaScript', 'Go', 'TypeScript', None, 'CSS', 'JavaScript', None, 'JavaScript', 'JavaScript', 'JavaScript', 'Java', None, 'Blade', 'Java', 'JavaScript', 'JavaScript', 'Python', 'JavaScript', 'JavaScript', 'Java', 'TypeScript', 'Dart', 'Python', None, 'Python', 'HTML', None, 'CSS', 'HTML', 'Solidity', 'Java', 'JavaScript', 'PHP', 'Java', 'Dart', None, 'Java', 'Dockerfile', 'C', 'Python', 'JavaScript', None, None, 'PHP', None, 'JavaScript', 'HTML', 'Java', 'Java', 'HTML', 'JavaScript', 'Java', None, 'C', 'Java', None, 'JavaScript', 'HTML', None, 'Jupyter Notebook', 'PHP', 'Java', None, 'Java', 'PHP', 'HTML', 'Java', 'Java', 'HTML', 'HTML', 'Java', None, 'Java', None, 'Java', 'JavaScript', 'PHP', None, None, None, None, 'JavaScript', 'PHP', 'Java', None, 'Jupyter Notebook', None, 'Python', 'HTML', 'JavaScript', 'Swift', 'Java', 'JavaScript', None, None, 'TypeScript', None, 'JavaScript', None, 'Dart', 'PHP', 'JavaScript', None, 'JavaScript', 'JavaScript', 'HTML', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', 'Svelte', 'Java', 'Java', None, 'JavaScript', 'JavaScript', 'Java', 'Java', None, 'JavaScript', 'TypeScript', 'JavaScript', 'JavaScript', 'Jupyter Notebook', None, 'Java', 'PHP', 'Kotlin', 'CSS', 'Java', 'TypeScript', 'TypeScript', 'JavaScript', 'TypeScript', 'JavaScript', 'Java', 'Jupyter Notebook', 'HTML', 'TypeScript', None, 'JavaScript', None, 'CSS', None, 'Dart', 'JavaScript', None, None, 'TypeScript', 'TypeScript', 'JavaScript', 'HTML', None, 'HTML', None, 'HTML', None, 'Jupyter Notebook', 'Java', None, 'Python', 'Java', None, 'HTML', None, 'HTML', 'Java', 'Python', None, 'JavaScript', 'HTML', 'JavaScript', 'Python', 'CSS', 'Python', 'HTML', 'TypeScript', 'HTML', 'CSS', 'Java', 'JavaScript', 'JavaScript', 'HTML', 'Python', 'Java', 'Java', 'Java', 'EJS', 'JavaScript', 'PHP', 'Python', None, 'CSS', 'Python', 'HTML', 'HTML', None], 'fav_topic': ['accordion', 'php', 'php', 'autocomplete', None, None, 'machine-learning', None, 'php', 'typescript', 'hacktoberfest', 'css', 'javascript', 'cms', 'alibaba', 'react', 'api', None, 'python', 'javascript', 'android', 'php', 'machine-learning', None, 'demographics', 'application-wrapper', 'kubernetes', 'careers', 'api', 'react-native', 'careers', 'vue', 'careers', 'dart', 'browser', 'synced-settings', 'php', 'java', None, None, 'javascript', 'esmf', 'javascript', 'font', 'mpesa', 'php', 'command-line', 'accordion', 'css', 'hacktoberfest', None, 'compiler', 'bypass', 'r', 'laravel', 'typescript', 'bpmn', 'hacking', 'api', 'climate', 'javascript', 'android', 'swift', 'css', 'java', 'flutter', 'javascript', 'hacktoberfest', 'css-questions', 'javascript', 'android', None, 'java', 'hacktoberfest', 'android', 'mozambique', 'android', 'awesome-list', 'hacktoberfest', 'android', 'laravel', 'python', 'docker', 'dotnet', None, None, 'bootstrap', None, None, 'remote-sensing', None, 'ai-art', 'uber-clone', 'javascript', 'cisco', 'careers', 'education', 'framework', 'javascript', 'gamification', None, 'hacktoberfest', 'hacktoberfest', 'javascript', 'javascript', 'hacktoberfest', 'java', 'api', 'golang', 'android', 'react', 'php', 'android', 'animation', 'e-commerce', 'javascript', 'laravel', 'vue', 'java', 'javascript', 'google-cloud', 'java', None, 'laravel', 'wordpress', 'dicebear', 'framework', 'typescript', 'laravel', None, 'awesome-list', 'python', 'careers', 'apps', None, None, 'angular', 'go', 'vue', 'cordova', 'javascript', 'hacktoberfest', 'dataset', 'python', None, None, 'angular', 'nextjs', 'careers', 'careers', 'create', None, 'books', 'hacktoberfest', 'data-science', 'careers', 'react', 'careers', 'asp-net-core', 'javascript', 'python', 'javascript', 'hacktoberfest', None, 'python', 'laravel', 'javascript', 'kotlin', None, None, None, 'next14', None, None, 'css3', 'atom', 'bootstrap', None, 'composer', 'application-realtime', 'python', 'software-testing', 'javascript', 'hacktoberfest', 'boostrap', 'blog-engine', 'machine-learning', None, None, 'laravel', 'android', 'android', None, 'mpesa', None, None, 'django', 'hacktoberfest', 'best-of', 'javascript', 'python', None, 'config', 'hacktoberfest', 'android', 'blockchain', None, 'hacktoberfest', 'activator', 'css', None, 'android', 'mpesa', 'css', 'flutter', 'animation', 'javascript', 'hacktoberfest', 'awesome', None, 'android', 'gratuito', None, 'bootstrap', None, 'aplicativo', 'hacktoberfest', 'tutorials', None, None, 'hacktoberfest', 'discord', 'java', 'hacktoberfest', 'javascript', 'bios', 'css', 'dart', 'angular', 'msisdn-validate', 'laravel', 'vue', None, 'bootstrap', 'material', 'api', 'javascript', 'java', 'api', None, None, 'vue', 'bootstrap4', 'flutter', 'nodejs', 'kotlin', 'cli', 'javascript', 'django', 'laravel', None, 'windows', 'react', 'android', 'react', None, 'express', 'react-native', None, 'cyber-security', None, 'lists', '100daysofcode', 'nodejs', 'c-sharp', 'calculator', None, 'c-sharp', 'nlw-06', 'react', 'flutter', 'android', 'expo', 'javascript', 'flutter', 'algorithm', 'formatter', 'hacktoberfest', None, 'design-system', None, None, None, None, 'css', 'drag-and-drop', 'api', 'applications', 'awesome-list', 'github', 'javascript', None, 'javascript', 'educational', 'blue-team', None, 'flutter', 'android', 'nodejs', 'open-source', 'html', 'busybox', 'data-science', 'admin', 'security', 'css', None, None, None, 'flutter', 'laravel', 'data-analysis', 'react', None, 'authentication', 'framework', 'database', 'fullpage', 'react', 'vue', 'adminlte3', 'docker', None, 'android', 'golang-package', 'javascript', 'kotlin', 'synced-settings', None, None, 'vim', 'config', None, 'php', 'dart', 'css', 'cheat-fortnite-', 'challenge', 'hacktoberfest', None, 'php', 'imersao-java', 'awesome', 'flutter', 'hacktoberfest', 'hacktoberfest', 'desktop', None, None, 'python', 'github', 'java', 'codeinthedark', 'opengl', 'blockchain', 'spring-boot', 'mpesa', 'aws', 'java', 'laravel', 'samora-lang', 'machine-learning', 'css', 'react', None, 'blazor', 'javascript', 'betty', 'deep-learning', 'awesome', 'fga', 'components', 'algorithms', 'hacktoberfest', 'java', 'mozambique', 'flutter', 'python', None, 'android', None, None, 'css3', 'javascript', 'analysis', 'war-thunder-aimbot', None, None, 'aix', 'security', 'openai-api', 'nodejs', None, 'typescript', 'awesome-react-stuff', None, 'hacktoberfest', 'javascript', None, 'datascience', 'hacktoberfest', None, 'django', 'framework', 'security', None, 'codeinthedark', None, '2d', 'c', None, None, 'best-practices', None, 'react', 'go', 'e2payments', 'laravel', 'react', 'javascript', 'html', 'macos', None, 'components', 'typescript', 'javascript', 'hacktoberfest', 'laravel', 'applications', 'css', None, None, 'adminlte', 'create', 'admin', 'linux', 'react', 'guidelines', 'java', None, None, 'mpesa', 'exploitation', None, 'git', None, None, 'activemq', 'bash', 'books', None, 'advent-of-code', None, 'clean-architecture', 'javascript', None, None, None, 'config', None, 'algorithm-visualisation', 'cpp', None, 'javascript', None, 'curso-em-video', 'hacktoberfest', 'css', 'ruby', None, 'git', None, 'book', 'expo', 'react', 'calculations', None, 'vuejs', None, None, 'coding-in-community', 'hacktoberfest', 'nextjs14', 'curso', 'react', 'react', 'android', None, 'animated', 'canvas', None, 'binary', 'react-native', 'javascript', 'hacktoberfest', 'api', 'hacktoberfest', 'python', 'typescript', 'config', None, None, None, 'face-detection', 'machine-learning', 'dart', 'd3js', 'annotations', 'android', 'books', 'javascript', 'api', 'react', None, 'ai-images', 'education', 'boostrap', 'hacktoberfest', None, 'javascript', 'api', None, None, 'awesome-list', 'php', 'awesome', 'django', 'react', 'brands', 'gis', 'css3', 'laravel', None, 'cheat-sheet', 'typescript', 'algorithm', None, 'java', 'php', None, 'javascript', None, None, 'api', 'portfolio-site', 'hacktoberfest', None, 'community', 'react', None, 'javascript', 'java', 'begginers', None, None, 'config', 'advance-ecommerce-project', 'collaborate', 'php', 'config', 'javascript', 'javascript', 'react', 'collaborate', 'android', 'flutter', 'python', 'github', 'hacktoberfest', 'curso', None, None, 'capture', 'git', None, 'coming-soon-page', None, None, 'flutter', 'aws', None, None, None, 'awesome', 'python', 'typescript', 'nextjs', 'config', 'awesome-list', None, 'css3', None, None, 'bootstrap4', None, 'java', 'javascript', 'editor', None, 'hacktoberfest', 'best-practices', 'exploratorydataanalysis', 'javascript', 'cartography', 'excel', 'android', None, 'java17', 'attachment', None, 'crud', None, 'bootstrap5', 'portfolio', 'android', None, None, 'tutorial', None, 'recognition', None, 'bash-configuration', 'laravel', None, 'appsec', 'javascript', 'desktop', None, 'config', 'data-science', None, 'amazon', None, 'javascript', 'ios', None, 'javascript', 'animations', 'hacktoberfest', 'typescript', 'intern', 'typescript', 'awesome', None, 'deploy', 'javascript', 'game-development', 'javascript', 'aws-ses', 'javascript', 'artificial-intelligence', 'hacktoberfest', None, 'beginner-project', 'component', None, 'hacktoberfest', None, 'component', 'javascript', 'brasil', None, 'hacktoberfest', 'adhan', 'mozambique', 'css', None, 'javascript', None, 'projetos-em-java', None, 'declarative', None, 'java', 'react', None, 'game', 'cheat-sheet', None, 'dio', 'design-system', 'maintenance-page', 'hacktoberfest', 'brute-force', None, None, 'css3', None, 'dart', 'awesome-list', None, 'hacktoberfest', 'chat', 'agnus', 'hacktoberfest', 'gustavoguanabara', None, None, 'awesome-list', None, None, 'ai', None, 'angular-roadmap', None, 'java', None, 'e2payments', 'algorithms', 'rocketseat', 'reactjs', 'linux', 'apoio', 'sms', 'curso', 'mozambique', 'github', None, None, None, 'android', None, 'html-css', None, 'books', None, None, None, None, None, 'java', None, None, None, 'javascript', 'config', 'config', 'django', 'curso', None, 'curso']}\n" ] }, { @@ -198,13 +200,13 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 5, "id": "775ada8b", "metadata": {}, "outputs": [], "source": [ "users_data = pd.DataFrame(final_data)\n", - "users_data.to_csv(f\"../../data/processed/{dir_name}/starred.csv\", index=False, encoding='latin1')" + "users_data.to_csv(f\"{base_path}/starred.csv\", index=False, encoding='latin1')" ] }, { diff --git a/notebooks/01. data_collect/get_users_data.ipynb b/notebooks/01. data_collect/get_users_data.ipynb index b2328ca..ed1297f 100644 --- a/notebooks/01. data_collect/get_users_data.ipynb +++ b/notebooks/01. data_collect/get_users_data.ipynb @@ -51,8 +51,10 @@ "source": [ "# Load data from CSV file\n", "dir_name = os.getenv('DIR_NAME')\n", + "base_path = f'../../data/processed/{dir_name}'\n", + "os.makedirs(base_path, exist_ok=True)\n", "\n", - "users_ids = pd.read_csv(f'../../data/processed/{dir_name}/users_ids.csv', encoding='latin1')\n", + "users_ids = pd.read_csv(f'{base_path}/users_ids.csv', encoding='latin1')\n", "users_ids = users_ids['user_id'].to_list()" ] }, @@ -71,7 +73,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "Processing: 100%|██████████| 1729/1729 [26:52<00:00, 1.07it/s]" + "Processing: 100%|██████████| 1734/1734 [26:05<00:00, 1.11it/s] " ] }, { @@ -168,8 +170,8 @@ "final_data, unknown_province_data = get_users_data(users_ids)\n", "\n", "# Create a DataFrame with the new data\n", - "filename = f\"../../data/processed/{dir_name}/users_data.csv\"\n", - "up_filename = f\"../../data/processed/{dir_name}/unknown_province.csv\"\n", + "filename = f\"{base_path}/users_data.csv\"\n", + "up_filename = f\"{base_path}/unknown_province.csv\"\n", "\n", "users_data = pd.DataFrame(final_data)\n", "up_data = pd.DataFrame(unknown_province_data)\n", diff --git a/notebooks/01. data_collect/get_users_ids.ipynb b/notebooks/01. data_collect/get_users_ids.ipynb index c6da799..58ff1a4 100644 --- a/notebooks/01. data_collect/get_users_ids.ipynb +++ b/notebooks/01. data_collect/get_users_ids.ipynb @@ -50,10 +50,10 @@ "name": "stdout", "output_type": "stream", "text": [ - "Mozambique: 1382\n", - "Moçambique: 254\n", + "Mozambique: 1406\n", + "Moçambique: 256\n", "Mocambique: 44\n", - "Maputo: 1049\n", + "Maputo: 1065\n", "Matola: 64\n" ] } @@ -200,7 +200,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, "id": "53ebd458-ef4a-451d-b34a-0c2280f3dec1", "metadata": {}, "outputs": [ @@ -208,26 +208,26 @@ "name": "stdout", "output_type": "stream", "text": [ - "The IDs were successfully written to the file ../../data/raw/2024_04/mozambique.csv!\n", - "The IDs were successfully written to the file ../../data/raw/2024_04/moçambique.csv!\n", - "The IDs were successfully written to the file ../../data/raw/2024_04/mocambique.csv!\n", - "The IDs were successfully written to the file ../../data/raw/2024_04/maputo.csv!\n", - "The IDs were successfully written to the file ../../data/raw/2024_04/matola.csv!\n" + "The IDs were successfully written to the file ../../data/raw/2024_05/mozambique.csv!\n", + "The IDs were successfully written to the file ../../data/raw/2024_05/moçambique.csv!\n", + "The IDs were successfully written to the file ../../data/raw/2024_05/mocambique.csv!\n", + "The IDs were successfully written to the file ../../data/raw/2024_05/maputo.csv!\n", + "The IDs were successfully written to the file ../../data/raw/2024_05/matola.csv!\n" ] } ], "source": [ - "# Main\n", + "dir_name = os.getenv('DIR_NAME')\n", + "base_path = f'../../data/raw/{dir_name}'\n", + "\n", + "os.makedirs(base_path, exist_ok=True)\n", + "\n", "for loc in locations:\n", - " final_data = get_users_ids_by_location(loc) # Here we put the list of collected ids\n", + " final_data = get_users_ids_by_location(loc) \n", "\n", - " dir_name = os.getenv('DIR_NAME')\n", + " file_name = f'{base_path}/{loc.lower()}.csv'\n", " \n", - " file_name = f'../../data/raw/{dir_name}/{loc.lower()}.csv' # e.g.: '../../data/raw/2024_02/mozambique.csv'\n", - " \n", - " write_csv(final_data, file_name)\n", - "\n", - " final_data = []\n" + " write_csv(final_data, file_name)\n" ] }, {