Skip to content

Commit c186a66

Browse files
Merge pull request #25 from aureliopatelli/main
solved problems with nan entries in pandas
2 parents cac80c0 + d046c70 commit c186a66

1 file changed

Lines changed: 4 additions & 3 deletions

File tree

fermi/matrix_processor.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -225,9 +225,8 @@ def _load_from_path(self, path: Path, **kwargs):
225225
conv = pd.to_numeric(first, errors="coerce")
226226
frac_nan = conv.isna().mean()
227227
if frac_nan > 0.5:
228-
# uso la prima colonna come indice e la rimuovo dai dati
229228
df = df.set_index(df.columns[0])
230-
return self._load_from_dataframe(df)
229+
return self._load_from_dataframe(df.fillna(0))
231230

232231
if ext in ['.xlsx','..xls']:
233232
df = pd.read_excel(path, **kwargs)
@@ -252,7 +251,9 @@ def _load_from_path(self, path: Path, **kwargs):
252251
def _load_from_dataframe(self, df: pd.DataFrame) -> Tuple[csr_matrix, List[str], List[str]]:
253252
rows = df.index.tolist() if not df.index.equals(pd.RangeIndex(len(df))) else []
254253
cols = df.columns.tolist() if not df.columns.equals(pd.RangeIndex(len(df.columns))) else []
255-
return sp.csr_matrix(df.values), rows, cols
254+
mat = sp.csr_matrix(df.values)
255+
mat.eliminate_zeros()
256+
return mat, rows, cols
256257

257258
def _load_from_other(self, obj: Any) -> csr_matrix:
258259
if sp.issparse(obj):

0 commit comments

Comments
 (0)