{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "53445797-52c4-4443-8095-889cf1c24298",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"%load_ext autoreload\n"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "4de950c8-cabe-4874-aa78-548342993b05",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"%autoreload 1"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "bccbd4ee-e6e7-4bc5-b72c-98196e811766",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"import pandas as pd\n"
]
},
{
"cell_type": "code",
"execution_count": 27,
"id": "7b337190-7887-40b7-9d10-b8039f5f2dfd",
"metadata": {},
"outputs": [],
"source": [
"project_df = pd.read_csv('encore-files/project.csv')\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "44729805-deb3-4c61-b019-c9f52c5898f0",
"metadata": {
"tags": []
},
"outputs": [
{
"data": {
"text/plain": [
"Index(['id', 'address', 'building_type', 'city', 'country', 'customer_name',\n",
" 'description', 'name', 'no_of_habitants', 'postal_code', 'projectuuid',\n",
" 'state', 'year_of_construction', 'bms_information_id',\n",
" 'project_coordinator_id', 'project_tag_id', 'ifc_before_tagid',\n",
" 'ifc_to_be_tagid', 'ifc_enhanced_tagid'],\n",
" dtype='object')"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"project_df.columns"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "561aa71c-c506-47b7-8b5f-6c00104a8e91",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"# Keep only the id columns of the project table.\n",
"# .copy() makes an independent frame, so columns can be added to it later\n",
"# without pandas raising SettingWithCopyWarning.\n",
"only_ifc_ids = project_df[['project_tag_id', 'ifc_before_tagid',\n",
"                          'ifc_to_be_tagid', 'ifc_enhanced_tagid']].copy()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "0af0d724-4dc5-434d-8209-e6604330c4e9",
"metadata": {},
"outputs": [],
"source": [
"only_ifc_ids"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "d1fe283a-35cd-4bf6-80ef-bd1a68ac2961",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"def merge_cols(df, id_columns=(\"project_tag_id\", \"ifc_before_tagid\",\n",
"                               \"ifc_to_be_tagid\", \"ifc_enhanced_tagid\")):\n",
"    \"\"\"Gather the ids stored in several columns into a single ``all_ids`` column.\n",
"\n",
"    The id columns are stacked on top of each other (one id per row) rather than\n",
"    added with ``+``: adding string columns joins the ids of a row into one long\n",
"    string and gives NaN as soon as one id is missing, so the result can never be\n",
"    matched against individual folder names.\n",
"\n",
"    Args:\n",
"        df: DataFrame that contains every column listed in ``id_columns``.\n",
"            It is not modified.\n",
"        id_columns: Names of the columns holding the ids. Defaults to the four\n",
"            tag-id columns of the project table.\n",
"\n",
"    Returns:\n",
"        DataFrame with one column, ``all_ids``, holding each non-missing id once,\n",
"        indexed 0..n-1.\n",
"\n",
"    Raises:\n",
"        KeyError: If one of ``id_columns`` is not a column of ``df``.\n",
"    \"\"\"\n",
"    all_ids = (\n",
"        df[list(id_columns)]\n",
"        .melt(value_name=\"all_ids\")[\"all_ids\"]  # long format: one id per row\n",
"        .dropna()  # cells that hold no id\n",
"        .drop_duplicates()  # the same id may appear in several columns\n",
"        .reset_index(drop=True)\n",
"    )\n",
"    return all_ids.to_frame()"
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "bfdca4ba-edf0-4394-b20d-8ab04130a30f",
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/tmp/ipykernel_98/3701186255.py:2: SettingWithCopyWarning: \n",
"A value is trying to be set on a copy of a slice from a DataFrame.\n",
"Try using .loc[row_indexer,col_indexer] = value instead\n",
"\n",
"See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
" df[\"all_ids\"] = df[\"project_tag_id\"] + df[\"project_tag_id\"] + df[\"ifc_to_be_tagid\"] + df[\"ifc_enhanced_tagid\"]\n"
]
}
],
"source": [
"ids_from_database = merge_cols(only_ifc_ids)"
]
},
{
"cell_type": "code",
"execution_count": 24,
"id": "b8aee40a-7cc9-41b0-a1ef-4c3ed293f229",
"metadata": {
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" all_ids | \n",
"
\n",
" \n",
" \n",
" \n",
" | 0 | \n",
" 97a3e117-a4b9-463f-81ed-8a0fd6826b1297a3e117-a... | \n",
"
\n",
" \n",
" | 1 | \n",
" NaN | \n",
"
\n",
" \n",
" | 2 | \n",
" NaN | \n",
"
\n",
" \n",
" | 3 | \n",
" NaN | \n",
"
\n",
" \n",
" | 4 | \n",
" b27ac00c-0b6f-4909-81db-ef8c136c1c28b27ac00c-0... | \n",
"
\n",
" \n",
" | 5 | \n",
" NaN | \n",
"
\n",
" \n",
" | 6 | \n",
" d48ed765-b997-4998-b48f-d5c6f37764a2d48ed765-b... | \n",
"
\n",
" \n",
" | 7 | \n",
" NaN | \n",
"
\n",
" \n",
" | 8 | \n",
" 3fe6a2a0-dcf6-4108-b079-085e7817b9333fe6a2a0-d... | \n",
"
\n",
" \n",
" | 9 | \n",
" 4036063b-84bf-4312-883d-306648307e814036063b-8... | \n",
"
\n",
" \n",
" | 10 | \n",
" 6e36b3b6-1b35-46a0-89b4-c64b2dcfc4d26e36b3b6-1... | \n",
"
\n",
" \n",
" | 11 | \n",
" NaN | \n",
"
\n",
" \n",
" | 12 | \n",
" 6c886d15-2ddf-489e-8440-066ad5c0c0516c886d15-2... | \n",
"
\n",
" \n",
" | 13 | \n",
" 6ba02956-f25b-4a68-8c02-0d6308b4460f6ba02956-f... | \n",
"
\n",
" \n",
" | 14 | \n",
" cc1e623d-ba33-4f84-8bfb-7d19d062cc20cc1e623d-b... | \n",
"
\n",
" \n",
" | 15 | \n",
" fe04ff9b-c1ff-41c4-9377-b7df1cfe2d22fe04ff9b-c... | \n",
"
\n",
" \n",
" | 16 | \n",
" aa0efa31-7f46-4511-bf25-1a14f724d43baa0efa31-7... | \n",
"
\n",
" \n",
" | 17 | \n",
" NaN | \n",
"
\n",
" \n",
" | 18 | \n",
" NaN | \n",
"
\n",
" \n",
" | 19 | \n",
" 5d768096-e9e0-4b2d-bd3b-5e48349fd4ca5d768096-e... | \n",
"
\n",
" \n",
" | 20 | \n",
" bdd29bf3-c04a-4dd2-85b8-28195d167dffbdd29bf3-c... | \n",
"
\n",
" \n",
" | 21 | \n",
" 67001609-3c2d-4963-9838-b211b0f5010667001609-3... | \n",
"
\n",
" \n",
" | 22 | \n",
" 9747c628-6b97-4b21-a9b2-7a249afedafb9747c628-6... | \n",
"
\n",
" \n",
" | 23 | \n",
" 02cafcb1-98aa-4a7c-bf1e-ddf55a9d5fbe02cafcb1-9... | \n",
"
\n",
" \n",
" | 24 | \n",
" ebff9dd8-e032-4bed-ab15-67279baf9604ebff9dd8-e... | \n",
"
\n",
" \n",
" | 25 | \n",
" 2aa3427a-5388-4bf7-8076-681f1b8ad5d42aa3427a-5... | \n",
"
\n",
" \n",
" | 26 | \n",
" 246a4471-9477-4adf-9ec5-42ad325733a6246a4471-9... | \n",
"
\n",
" \n",
" | 27 | \n",
" 337f2a2e-2826-4bc8-83c2-8c0459781c1d337f2a2e-2... | \n",
"
\n",
" \n",
" | 28 | \n",
" 7ac6f1a5-9ecb-4ab2-9fc1-7abad928544e7ac6f1a5-9... | \n",
"
\n",
" \n",
" | 29 | \n",
" a258185a-f60c-452e-82e3-572a544f22cca258185a-f... | \n",
"
\n",
" \n",
" | 30 | \n",
" e7bde166-4910-407b-9b1d-1943fbcd6da4e7bde166-4... | \n",
"
\n",
" \n",
" | 31 | \n",
" 5660466b-2600-4b9e-bbce-faf192cfc9065660466b-2... | \n",
"
\n",
" \n",
" | 32 | \n",
" c4cd356d-9d70-4952-8f18-39b3807c81dfc4cd356d-9... | \n",
"
\n",
" \n",
" | 33 | \n",
" 1fc260f6-4713-4b06-a680-38614db8d9561fc260f6-4... | \n",
"
\n",
" \n",
" | 34 | \n",
" 432c91b2-ff25-469f-a623-3f39d5ed67d2432c91b2-f... | \n",
"
\n",
" \n",
" | 35 | \n",
" 7397b503-33ab-47ef-acbe-09edb2176ff37397b503-3... | \n",
"
\n",
" \n",
" | 36 | \n",
" 8269294e-a9b0-483c-8abe-25dbda0656cf8269294e-a... | \n",
"
\n",
" \n",
" | 37 | \n",
" f2b10aa9-536d-4968-ba7b-eaa98e717f43f2b10aa9-5... | \n",
"
\n",
" \n",
" | 38 | \n",
" ed5db4a1-5560-4753-9c6b-4e4dc3168ddfed5db4a1-5... | \n",
"
\n",
" \n",
" | 39 | \n",
" aa252dd8-4d8e-45ec-ab5e-a531085c2459aa252dd8-4... | \n",
"
\n",
" \n",
" | 40 | \n",
" 6aff4eb5-c6f3-4a3a-8052-0e9d2525969d6aff4eb5-c... | \n",
"
\n",
" \n",
" | 41 | \n",
" e4909d99-cf20-4334-835b-598c66ee2ce1e4909d99-c... | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" all_ids\n",
"0 97a3e117-a4b9-463f-81ed-8a0fd6826b1297a3e117-a...\n",
"1 NaN\n",
"2 NaN\n",
"3 NaN\n",
"4 b27ac00c-0b6f-4909-81db-ef8c136c1c28b27ac00c-0...\n",
"5 NaN\n",
"6 d48ed765-b997-4998-b48f-d5c6f37764a2d48ed765-b...\n",
"7 NaN\n",
"8 3fe6a2a0-dcf6-4108-b079-085e7817b9333fe6a2a0-d...\n",
"9 4036063b-84bf-4312-883d-306648307e814036063b-8...\n",
"10 6e36b3b6-1b35-46a0-89b4-c64b2dcfc4d26e36b3b6-1...\n",
"11 NaN\n",
"12 6c886d15-2ddf-489e-8440-066ad5c0c0516c886d15-2...\n",
"13 6ba02956-f25b-4a68-8c02-0d6308b4460f6ba02956-f...\n",
"14 cc1e623d-ba33-4f84-8bfb-7d19d062cc20cc1e623d-b...\n",
"15 fe04ff9b-c1ff-41c4-9377-b7df1cfe2d22fe04ff9b-c...\n",
"16 aa0efa31-7f46-4511-bf25-1a14f724d43baa0efa31-7...\n",
"17 NaN\n",
"18 NaN\n",
"19 5d768096-e9e0-4b2d-bd3b-5e48349fd4ca5d768096-e...\n",
"20 bdd29bf3-c04a-4dd2-85b8-28195d167dffbdd29bf3-c...\n",
"21 67001609-3c2d-4963-9838-b211b0f5010667001609-3...\n",
"22 9747c628-6b97-4b21-a9b2-7a249afedafb9747c628-6...\n",
"23 02cafcb1-98aa-4a7c-bf1e-ddf55a9d5fbe02cafcb1-9...\n",
"24 ebff9dd8-e032-4bed-ab15-67279baf9604ebff9dd8-e...\n",
"25 2aa3427a-5388-4bf7-8076-681f1b8ad5d42aa3427a-5...\n",
"26 246a4471-9477-4adf-9ec5-42ad325733a6246a4471-9...\n",
"27 337f2a2e-2826-4bc8-83c2-8c0459781c1d337f2a2e-2...\n",
"28 7ac6f1a5-9ecb-4ab2-9fc1-7abad928544e7ac6f1a5-9...\n",
"29 a258185a-f60c-452e-82e3-572a544f22cca258185a-f...\n",
"30 e7bde166-4910-407b-9b1d-1943fbcd6da4e7bde166-4...\n",
"31 5660466b-2600-4b9e-bbce-faf192cfc9065660466b-2...\n",
"32 c4cd356d-9d70-4952-8f18-39b3807c81dfc4cd356d-9...\n",
"33 1fc260f6-4713-4b06-a680-38614db8d9561fc260f6-4...\n",
"34 432c91b2-ff25-469f-a623-3f39d5ed67d2432c91b2-f...\n",
"35 7397b503-33ab-47ef-acbe-09edb2176ff37397b503-3...\n",
"36 8269294e-a9b0-483c-8abe-25dbda0656cf8269294e-a...\n",
"37 f2b10aa9-536d-4968-ba7b-eaa98e717f43f2b10aa9-5...\n",
"38 ed5db4a1-5560-4753-9c6b-4e4dc3168ddfed5db4a1-5...\n",
"39 aa252dd8-4d8e-45ec-ab5e-a531085c2459aa252dd8-4...\n",
"40 6aff4eb5-c6f3-4a3a-8052-0e9d2525969d6aff4eb5-c...\n",
"41 e4909d99-cf20-4334-835b-598c66ee2ce1e4909d99-c..."
]
},
"execution_count": 24,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"ids_from_database"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "f52b6cc0-e0ea-479b-a24e-d4bcfa769bd2",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"converted_files_df = pd.read_csv('encore-files/filenames-only.csv')\n"
]
},
{
"cell_type": "code",
"execution_count": 26,
"id": "da181f14-a495-4950-b4f4-cba92b099184",
"metadata": {
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" foldername | \n",
"
\n",
" \n",
" \n",
" \n",
" | 238590 | \n",
" fffb5e51-74ec-4829-8074-fc095346c8a6 | \n",
"
\n",
" \n",
" | 238591 | \n",
" fffc44dd-2c8d-4d71-b08e-e192e7ad9b37 | \n",
"
\n",
" \n",
" | 238592 | \n",
" fffc79c6-5f47-4641-87c6-57cc28478f73 | \n",
"
\n",
" \n",
" | 238593 | \n",
" fffcc424-c740-46da-b57c-cc97be249524 | \n",
"
\n",
" \n",
" | 238594 | \n",
" fffcda08-0da5-4c2a-ab94-fd49477d18dc | \n",
"
\n",
" \n",
" | 238595 | \n",
" fffd27c4-ca0b-4067-96d8-848f50a43224 | \n",
"
\n",
" \n",
" | 238596 | \n",
" fffdab41-f136-4eaa-b870-68aff14e0763 | \n",
"
\n",
" \n",
" | 238597 | \n",
" fffdedf2-3063-4da8-b7da-cfd7eb76cf90 | \n",
"
\n",
" \n",
" | 238598 | \n",
" fffdf3d8-7069-4c19-90b5-d96d7459b54d | \n",
"
\n",
" \n",
" | 238599 | \n",
" fffe0eff-dd7e-4dbb-9f71-29401c553e25 | \n",
"
\n",
" \n",
" | 238600 | \n",
" ffff29a7-ae72-4620-9abf-e3919bd23fe5 | \n",
"
\n",
" \n",
" | 238601 | \n",
" ffff502d-7393-4425-898d-21fefd5bc0e3 | \n",
"
\n",
" \n",
" | 238602 | \n",
" ffff5b42-575a-48c0-8093-61db051f903b | \n",
"
\n",
" \n",
" | 238603 | \n",
" ffff83bb-bbc8-43c1-a219-e35a5b2e28bd | \n",
"
\n",
" \n",
" | 238604 | \n",
" ffffc0e5-0a22-41b1-9d50-c532e2c313aa | \n",
"
\n",
" \n",
" | 238605 | \n",
" filenames-only.txt | \n",
"
\n",
" \n",
" | 238606 | \n",
" filenames.txt | \n",
"
\n",
" \n",
" | 238607 | \n",
" files.txt | \n",
"
\n",
" \n",
" | 238608 | \n",
" files2.txt | \n",
"
\n",
" \n",
" | 238609 | \n",
" index.json | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" foldername\n",
"238590 fffb5e51-74ec-4829-8074-fc095346c8a6\n",
"238591 fffc44dd-2c8d-4d71-b08e-e192e7ad9b37\n",
"238592 fffc79c6-5f47-4641-87c6-57cc28478f73\n",
"238593 fffcc424-c740-46da-b57c-cc97be249524\n",
"238594 fffcda08-0da5-4c2a-ab94-fd49477d18dc\n",
"238595 fffd27c4-ca0b-4067-96d8-848f50a43224\n",
"238596 fffdab41-f136-4eaa-b870-68aff14e0763\n",
"238597 fffdedf2-3063-4da8-b7da-cfd7eb76cf90\n",
"238598 fffdf3d8-7069-4c19-90b5-d96d7459b54d\n",
"238599 fffe0eff-dd7e-4dbb-9f71-29401c553e25\n",
"238600 ffff29a7-ae72-4620-9abf-e3919bd23fe5\n",
"238601 ffff502d-7393-4425-898d-21fefd5bc0e3\n",
"238602 ffff5b42-575a-48c0-8093-61db051f903b\n",
"238603 ffff83bb-bbc8-43c1-a219-e35a5b2e28bd\n",
"238604 ffffc0e5-0a22-41b1-9d50-c532e2c313aa\n",
"238605 filenames-only.txt\n",
"238606 filenames.txt\n",
"238607 files.txt\n",
"238608 files2.txt\n",
"238609 index.json"
]
},
"execution_count": 26,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"converted_files_df.tail(20)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "fd2c24b7-ddb1-4d77-9a38-7e11599e91c5",
"metadata": {},
"outputs": [],
"source": [
"converted_files_df['foldername']"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "2fe47979-1a5b-41b4-9b11-5cb4616e6fd8",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"def get_diff_for_two_dataframes(df1, df2, col1='all_ids', col2='foldername'):\n",
"    \"\"\"Return the rows of df1 whose ``col1`` value does not occur in ``df2[col2]``.\n",
"\n",
"    Args:\n",
"        df1: DataFrame to filter; must contain the column ``col1``.\n",
"        df2: DataFrame to compare against; must contain the column ``col2``.\n",
"        col1: Column of df1 holding the values to look up.\n",
"        col2: Column of df2 holding the values that count as already present.\n",
"\n",
"    Returns:\n",
"        DataFrame with the rows of df1 (original index kept) whose ``col1``\n",
"        value is not found in ``df2[col2]``.\n",
"    \"\"\"\n",
"    found_in_df2 = df1[col1].isin(df2[col2])\n",
"    # ~ negates the boolean mask element-wise.\n",
"    return df1[~found_in_df2]"
]
},
{
"cell_type": "code",
"execution_count": 25,
"id": "5f5a9b4e-91e0-4cbf-8f31-e5cda02d88dc",
"metadata": {
"tags": []
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" | \n",
" all_ids | \n",
"
\n",
" \n",
" \n",
" \n",
" | 0 | \n",
" 97a3e117-a4b9-463f-81ed-8a0fd6826b1297a3e117-a... | \n",
"
\n",
" \n",
" | 1 | \n",
" NaN | \n",
"
\n",
" \n",
" | 2 | \n",
" NaN | \n",
"
\n",
" \n",
" | 3 | \n",
" NaN | \n",
"
\n",
" \n",
" | 4 | \n",
" b27ac00c-0b6f-4909-81db-ef8c136c1c28b27ac00c-0... | \n",
"
\n",
" \n",
" | 5 | \n",
" NaN | \n",
"
\n",
" \n",
" | 6 | \n",
" d48ed765-b997-4998-b48f-d5c6f37764a2d48ed765-b... | \n",
"
\n",
" \n",
" | 7 | \n",
" NaN | \n",
"
\n",
" \n",
" | 8 | \n",
" 3fe6a2a0-dcf6-4108-b079-085e7817b9333fe6a2a0-d... | \n",
"
\n",
" \n",
" | 9 | \n",
" 4036063b-84bf-4312-883d-306648307e814036063b-8... | \n",
"
\n",
" \n",
" | 10 | \n",
" 6e36b3b6-1b35-46a0-89b4-c64b2dcfc4d26e36b3b6-1... | \n",
"
\n",
" \n",
" | 11 | \n",
" NaN | \n",
"
\n",
" \n",
" | 12 | \n",
" 6c886d15-2ddf-489e-8440-066ad5c0c0516c886d15-2... | \n",
"
\n",
" \n",
" | 13 | \n",
" 6ba02956-f25b-4a68-8c02-0d6308b4460f6ba02956-f... | \n",
"
\n",
" \n",
" | 14 | \n",
" cc1e623d-ba33-4f84-8bfb-7d19d062cc20cc1e623d-b... | \n",
"
\n",
" \n",
" | 15 | \n",
" fe04ff9b-c1ff-41c4-9377-b7df1cfe2d22fe04ff9b-c... | \n",
"
\n",
" \n",
" | 16 | \n",
" aa0efa31-7f46-4511-bf25-1a14f724d43baa0efa31-7... | \n",
"
\n",
" \n",
" | 17 | \n",
" NaN | \n",
"
\n",
" \n",
" | 18 | \n",
" NaN | \n",
"
\n",
" \n",
" | 19 | \n",
" 5d768096-e9e0-4b2d-bd3b-5e48349fd4ca5d768096-e... | \n",
"
\n",
" \n",
" | 20 | \n",
" bdd29bf3-c04a-4dd2-85b8-28195d167dffbdd29bf3-c... | \n",
"
\n",
" \n",
" | 21 | \n",
" 67001609-3c2d-4963-9838-b211b0f5010667001609-3... | \n",
"
\n",
" \n",
" | 22 | \n",
" 9747c628-6b97-4b21-a9b2-7a249afedafb9747c628-6... | \n",
"
\n",
" \n",
" | 23 | \n",
" 02cafcb1-98aa-4a7c-bf1e-ddf55a9d5fbe02cafcb1-9... | \n",
"
\n",
" \n",
" | 24 | \n",
" ebff9dd8-e032-4bed-ab15-67279baf9604ebff9dd8-e... | \n",
"
\n",
" \n",
" | 25 | \n",
" 2aa3427a-5388-4bf7-8076-681f1b8ad5d42aa3427a-5... | \n",
"
\n",
" \n",
" | 26 | \n",
" 246a4471-9477-4adf-9ec5-42ad325733a6246a4471-9... | \n",
"
\n",
" \n",
" | 27 | \n",
" 337f2a2e-2826-4bc8-83c2-8c0459781c1d337f2a2e-2... | \n",
"
\n",
" \n",
" | 28 | \n",
" 7ac6f1a5-9ecb-4ab2-9fc1-7abad928544e7ac6f1a5-9... | \n",
"
\n",
" \n",
" | 29 | \n",
" a258185a-f60c-452e-82e3-572a544f22cca258185a-f... | \n",
"
\n",
" \n",
" | 30 | \n",
" e7bde166-4910-407b-9b1d-1943fbcd6da4e7bde166-4... | \n",
"
\n",
" \n",
" | 31 | \n",
" 5660466b-2600-4b9e-bbce-faf192cfc9065660466b-2... | \n",
"
\n",
" \n",
" | 32 | \n",
" c4cd356d-9d70-4952-8f18-39b3807c81dfc4cd356d-9... | \n",
"
\n",
" \n",
" | 33 | \n",
" 1fc260f6-4713-4b06-a680-38614db8d9561fc260f6-4... | \n",
"
\n",
" \n",
" | 34 | \n",
" 432c91b2-ff25-469f-a623-3f39d5ed67d2432c91b2-f... | \n",
"
\n",
" \n",
" | 35 | \n",
" 7397b503-33ab-47ef-acbe-09edb2176ff37397b503-3... | \n",
"
\n",
" \n",
" | 36 | \n",
" 8269294e-a9b0-483c-8abe-25dbda0656cf8269294e-a... | \n",
"
\n",
" \n",
" | 37 | \n",
" f2b10aa9-536d-4968-ba7b-eaa98e717f43f2b10aa9-5... | \n",
"
\n",
" \n",
" | 38 | \n",
" ed5db4a1-5560-4753-9c6b-4e4dc3168ddfed5db4a1-5... | \n",
"
\n",
" \n",
" | 39 | \n",
" aa252dd8-4d8e-45ec-ab5e-a531085c2459aa252dd8-4... | \n",
"
\n",
" \n",
" | 40 | \n",
" 6aff4eb5-c6f3-4a3a-8052-0e9d2525969d6aff4eb5-c... | \n",
"
\n",
" \n",
" | 41 | \n",
" e4909d99-cf20-4334-835b-598c66ee2ce1e4909d99-c... | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" all_ids\n",
"0 97a3e117-a4b9-463f-81ed-8a0fd6826b1297a3e117-a...\n",
"1 NaN\n",
"2 NaN\n",
"3 NaN\n",
"4 b27ac00c-0b6f-4909-81db-ef8c136c1c28b27ac00c-0...\n",
"5 NaN\n",
"6 d48ed765-b997-4998-b48f-d5c6f37764a2d48ed765-b...\n",
"7 NaN\n",
"8 3fe6a2a0-dcf6-4108-b079-085e7817b9333fe6a2a0-d...\n",
"9 4036063b-84bf-4312-883d-306648307e814036063b-8...\n",
"10 6e36b3b6-1b35-46a0-89b4-c64b2dcfc4d26e36b3b6-1...\n",
"11 NaN\n",
"12 6c886d15-2ddf-489e-8440-066ad5c0c0516c886d15-2...\n",
"13 6ba02956-f25b-4a68-8c02-0d6308b4460f6ba02956-f...\n",
"14 cc1e623d-ba33-4f84-8bfb-7d19d062cc20cc1e623d-b...\n",
"15 fe04ff9b-c1ff-41c4-9377-b7df1cfe2d22fe04ff9b-c...\n",
"16 aa0efa31-7f46-4511-bf25-1a14f724d43baa0efa31-7...\n",
"17 NaN\n",
"18 NaN\n",
"19 5d768096-e9e0-4b2d-bd3b-5e48349fd4ca5d768096-e...\n",
"20 bdd29bf3-c04a-4dd2-85b8-28195d167dffbdd29bf3-c...\n",
"21 67001609-3c2d-4963-9838-b211b0f5010667001609-3...\n",
"22 9747c628-6b97-4b21-a9b2-7a249afedafb9747c628-6...\n",
"23 02cafcb1-98aa-4a7c-bf1e-ddf55a9d5fbe02cafcb1-9...\n",
"24 ebff9dd8-e032-4bed-ab15-67279baf9604ebff9dd8-e...\n",
"25 2aa3427a-5388-4bf7-8076-681f1b8ad5d42aa3427a-5...\n",
"26 246a4471-9477-4adf-9ec5-42ad325733a6246a4471-9...\n",
"27 337f2a2e-2826-4bc8-83c2-8c0459781c1d337f2a2e-2...\n",
"28 7ac6f1a5-9ecb-4ab2-9fc1-7abad928544e7ac6f1a5-9...\n",
"29 a258185a-f60c-452e-82e3-572a544f22cca258185a-f...\n",
"30 e7bde166-4910-407b-9b1d-1943fbcd6da4e7bde166-4...\n",
"31 5660466b-2600-4b9e-bbce-faf192cfc9065660466b-2...\n",
"32 c4cd356d-9d70-4952-8f18-39b3807c81dfc4cd356d-9...\n",
"33 1fc260f6-4713-4b06-a680-38614db8d9561fc260f6-4...\n",
"34 432c91b2-ff25-469f-a623-3f39d5ed67d2432c91b2-f...\n",
"35 7397b503-33ab-47ef-acbe-09edb2176ff37397b503-3...\n",
"36 8269294e-a9b0-483c-8abe-25dbda0656cf8269294e-a...\n",
"37 f2b10aa9-536d-4968-ba7b-eaa98e717f43f2b10aa9-5...\n",
"38 ed5db4a1-5560-4753-9c6b-4e4dc3168ddfed5db4a1-5...\n",
"39 aa252dd8-4d8e-45ec-ab5e-a531085c2459aa252dd8-4...\n",
"40 6aff4eb5-c6f3-4a3a-8052-0e9d2525969d6aff4eb5-c...\n",
"41 e4909d99-cf20-4334-835b-598c66ee2ce1e4909d99-c..."
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"get_diff_for_two_dataframes(ids_from_database, converted_files_df)"
]
},
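{
"cell_type": "markdown",
"id": "ee2080ff-3a50-4170-894e-c617509ac578",
"metadata": {},
"source": [
"- The diff above has the same number of rows (42) as `ids_from_database`, so none of the IFC ids from the database were found among the converted folder names.\n",
"- **TODO:** the `all_ids` values shown above are several ids concatenated into one string (or `NaN`), which cannot equal a single folder name, so re-check this conclusion.\n"
]
},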
{
"cell_type": "code",
"execution_count": null,
"id": "0af46bf5-95f2-4fbf-af03-e2ba0f94c1f9",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"id": "47cd4a1f-96b9-4cdd-9d50-9fcb9a1000e2",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.10"
}
},
"nbformat": 4,
"nbformat_minor": 5
}