{ "cells": [ { "cell_type": "code", "execution_count": 20, "id": "3760b040-985c-46ec-ba77-13f0f7a52c83", "metadata": {}, "outputs": [], "source": [ "from pathlib import Path\n", "\n", "from lang_main import load_pickle" ] }, { "cell_type": "code", "execution_count": 28, "id": "97487448-82c8-4b3d-8a1a-ccccaaac8d86", "metadata": {}, "outputs": [], "source": [ "def get_files(path: str) -> tuple[Path, ...]:\n", "    \"\"\"Return all entries found directly inside the directory ``path``.\n", "\n", "    The entries are returned as a tuple of ``Path`` objects in the order\n", "    produced by ``Path.glob``. An ``AssertionError`` is raised when ``path``\n", "    does not exist.\n", "    \"\"\"\n", "    # Use the caller-supplied directory instead of a hard-coded location.\n", "    p = Path(path)\n", "    assert p.exists(), \"path does not exist\"\n", "    return tuple(p.glob(r'*'))" ] }, { "cell_type": "code", "execution_count": 87, "id": "598f4d99-9d35-49c9-8c5d-113d4c80cecf", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(WindowsPath('A:/Arbeitsaufgaben/lang-main/scripts/results/test_20240529/Pipe-TargetFeature_Step-3_remove_NA.pkl'),\n", " WindowsPath('A:/Arbeitsaufgaben/lang-main/scripts/results/test_20240529/Pipe-TargetFeature_Step-5_analyse_feature.pkl'),\n", " WindowsPath('A:/Arbeitsaufgaben/lang-main/scripts/results/test_20240529/Pipe-Merge_Duplicates_Step-1_merge_similarity_dupl.pkl'))" ] }, "execution_count": 87, "metadata": {}, "output_type": "execute_result" } ], "source": [ "files = get_files(r'A:\\Arbeitsaufgaben\\lang-main\\scripts\\results\\test_20240529')\n", "files" ] }, { "cell_type": "code", "execution_count": 88, "id": "55ad4af3-87cd-4189-9309-171aba4e04a6", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "shared:INFO | 2024-05-29 12:49:47 +0000 | Loaded file successfully.\n" ] } ], "source": [ "file = files[-1]\n", "ret = load_pickle(file)" ] }, { "cell_type": "code", "execution_count": 89, "id": "540f4720-a2bf-4171-8db5-8e6993d38c13", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | entry | \n", "len | \n", "num_occur | \n", "assoc_obj_ids | \n", "num_assoc_obj_ids | \n", "
|---|---|---|---|---|---|
| 162 | \n", "Tägliche Wartungstätigkeiten nach Vorgabe des ... | \n", "66 | \n", "92592 | \n", "[0, 17, 41, 42, 43, 44, 45, 46, 47, 51, 52, 53... | \n", "206 | \n", "
| 33 | \n", "Wöchentliche Sichtkontrolle / Reinigung | \n", "39 | \n", "3108 | \n", "[301, 304, 305, 313, 314, 323, 329, 331, 332, ... | \n", "74 | \n", "
| 131 | \n", "Tägliche Überprüfung der Ölabscheider | \n", "37 | \n", "1619 | \n", "[0, 970, 2134, 2137] | \n", "4 | \n", "
| 160 | \n", "Wöchentliche Kontrolle der C-Anlagen | \n", "36 | \n", "1265 | \n", "[1352, 1353, 1354, 1684, 1685, 1686, 1687, 168... | \n", "11 | \n", "
| 140 | \n", "Halbjährliche Kontrolle des Stabbreithalters | \n", "44 | \n", "687 | \n", "[51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 6... | \n", "166 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2559 | \n", "Fehler 9723 Leistungsversorgung Antrieb defekt | \n", "46 | \n", "1 | \n", "[211] | \n", "1 | \n", "
| 2558 | \n", "T-Warp-Let-Off1 schleppfehler | \n", "30 | \n", "1 | \n", "[93] | \n", "1 | \n", "
| 2557 | \n", "Fahrräder wurden gewartet und gereinigt. | \n", "40 | \n", "1 | \n", "[1707] | \n", "1 | \n", "
| 2556 | \n", "Bohrlöcher an Gebots- und Verbotszeichen anbri... | \n", "173 | \n", "1 | \n", "[1] | \n", "1 | \n", "
| 6782 | \n", "Befestigung Deckel für Batteriefach defekt ... | \n", "106 | \n", "2 | \n", "[306, 326] | \n", "2 | \n", "
4545 rows × 5 columns
\n", "| \n", " | index | \n", "entry | \n", "len | \n", "num_occur | \n", "assoc_obj_ids | \n", "num_assoc_obj_ids | \n", "
|---|---|---|---|---|---|---|
| 0 | \n", "162 | \n", "Tägliche Wartungstätigkeiten nach Vorgabe des ... | \n", "66 | \n", "92592 | \n", "[0, 17, 41, 42, 43, 44, 45, 46, 47, 51, 52, 53... | \n", "206 | \n", "
| 1 | \n", "33 | \n", "Wöchentliche Sichtkontrolle / Reinigung | \n", "39 | \n", "3108 | \n", "[301, 304, 305, 313, 314, 323, 329, 331, 332, ... | \n", "74 | \n", "
| 2 | \n", "131 | \n", "Tägliche Überprüfung der Ölabscheider | \n", "37 | \n", "1619 | \n", "[0, 970, 2134, 2137] | \n", "4 | \n", "
| 3 | \n", "160 | \n", "Wöchentliche Kontrolle der C-Anlagen | \n", "36 | \n", "1265 | \n", "[1352, 1353, 1354, 1684, 1685, 1686, 1687, 168... | \n", "11 | \n", "
| 4 | \n", "140 | \n", "Halbjährliche Kontrolle des Stabbreithalters | \n", "44 | \n", "687 | \n", "[51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 6... | \n", "166 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 6756 | \n", "2559 | \n", "Fehler 9723 Leistungsversorgung Antrieb defekt | \n", "46 | \n", "1 | \n", "[211] | \n", "1 | \n", "
| 6757 | \n", "2558 | \n", "T-Warp-Let-Off1 schleppfehler | \n", "30 | \n", "1 | \n", "[93] | \n", "1 | \n", "
| 6758 | \n", "2557 | \n", "Fahrräder wurden gewartet und gereinigt. | \n", "40 | \n", "1 | \n", "[1707] | \n", "1 | \n", "
| 6759 | \n", "2556 | \n", "Bohrlöcher an Gebots- und Verbotszeichen anbri... | \n", "173 | \n", "1 | \n", "[1] | \n", "1 | \n", "
| 6760 | \n", "6782 | \n", "Befestigung Deckel für Batteriefach defekt ... | \n", "106 | \n", "2 | \n", "[306, 326] | \n", "2 | \n", "
4545 rows × 6 columns
\n", "