|
2 | 2 | "cells": [
|
3 | 3 | {
|
4 | 4 | "cell_type": "code",
|
5 |
| - "execution_count": 1, |
| 5 | + "execution_count": 4, |
6 | 6 | "metadata": {},
|
7 | 7 | "outputs": [],
|
8 | 8 | "source": [
|
9 | 9 | "from magnet.ize.filings import Processor\n",
|
10 |
| - "source_data_file = \"./raw/kb_export_clean.csv\"\n", |
11 |
| - "export_data_file = \"./data/filings_mistral_nlp.parquet\"" |
| 10 | + "source_data_file = \"../../raw/kb_export_clean.csv\"\n", |
| 11 | + "export_data_file = \"../../data/filings_mistral_nlp.parquet\"" |
12 | 12 | ]
|
13 | 13 | },
|
14 | 14 | {
|
15 | 15 | "cell_type": "code",
|
16 |
| - "execution_count": 3, |
| 16 | + "execution_count": 5, |
17 | 17 | "metadata": {},
|
18 | 18 | "outputs": [
|
19 | 19 | {
|
20 | 20 | "name": "stdout",
|
21 | 21 | "output_type": "stream",
|
22 | 22 | "text": [
|
23 |
| - "\u001b[96m☕️ WAIT: loading - ./raw/kb_export_clean.csv\u001b[0m\n", |
24 |
| - "\u001b[92m🌊 SUCCESS: loaded - ./raw/kb_export_clean.csv\u001b[0m\n" |
| 23 | + "\u001b[96m☕️ WAIT: loading - ../raw/kb_export_clean.csv\u001b[0m\n", |
| 24 | + "\u001b[91m☠️ FATAL: [Errno 2] No such file or directory: '../raw/kb_export_clean.csv'\u001b[0m\n" |
25 | 25 | ]
|
26 | 26 | }
|
27 | 27 | ],
|
|
36 | 36 | },
|
37 | 37 | {
|
38 | 38 | "cell_type": "code",
|
39 |
| - "execution_count": 4, |
| 39 | + "execution_count": 3, |
40 | 40 | "metadata": {},
|
41 | 41 | "outputs": [
|
42 | 42 | {
|
43 |
| - "name": "stdout", |
44 |
| - "output_type": "stream", |
45 |
| - "text": [ |
46 |
| - "\u001b[96m☕️ WAIT: get coffee or tea - 65822 processing...\u001b[0m\n" |
47 |
| - ] |
48 |
| - }, |
49 |
| - { |
50 |
| - "name": "stderr", |
51 |
| - "output_type": "stream", |
52 |
| - "text": [ |
53 |
| - "100%|██████████| 65822/65822 [20:08<00:00, 54.48it/s] \n", |
54 |
| - "100%|██████████| 65822/65822 [00:02<00:00, 29005.30it/s]\n" |
55 |
| - ] |
56 |
| - }, |
57 |
| - { |
58 |
| - "name": "stdout", |
59 |
| - "output_type": "stream", |
60 |
| - "text": [ |
61 |
| - "\u001b[96m☕️ WAIT: saving to ./data/filings_mistral_nlp.parquet\u001b[0m\n", |
62 |
| - "\u001b[92m🌊 SUCCESS: saved - ./data/filings_mistral_nlp.parquet\u001b[0m\n" |
| 43 | + "ename": "AttributeError", |
| 44 | + "evalue": "'NoneType' object has no attribute 'dropna'", |
| 45 | + "output_type": "error", |
| 46 | + "traceback": [ |
| 47 | + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", |
| 48 | + "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)", |
| 49 | + "Cell \u001b[0;32mIn[3], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[38;5;28;01mawait\u001b[39;00m clustered_filings\u001b[38;5;241m.\u001b[39mprocess(\n\u001b[1;32m 2\u001b[0m export_data_file\n\u001b[1;32m 3\u001b[0m , nlp\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 4\u001b[0m )\n", |
| 50 | + "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/magnet/ize/filings.py:55\u001b[0m, in \u001b[0;36mProcessor.process\u001b[0;34m(self, path, splitter, nlp)\u001b[0m\n\u001b[1;32m 54\u001b[0m \u001b[38;5;28;01masync\u001b[39;00m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mprocess\u001b[39m(\u001b[38;5;28mself\u001b[39m, path: \u001b[38;5;28mstr\u001b[39m \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m, splitter: \u001b[38;5;28many\u001b[39m \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m, nlp\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m):\n\u001b[0;32m---> 55\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdf \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdf\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdropna\u001b[49m()\n\u001b[1;32m 56\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdf \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 57\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n", |
| 51 | + "\u001b[0;31mAttributeError\u001b[0m: 'NoneType' object has no attribute 'dropna'" |
63 | 52 | ]
|
64 | 53 | }
|
65 | 54 | ],
|
|
0 commit comments