Skip to content

Commit 10ee2e8

Browse files
committed
fsspark -> fslite
1 parent c2312c8 commit 10ee2e8

31 files changed

+67
-146
lines changed

docs/README.data.md

Lines changed: 12 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -37,19 +37,21 @@ The following is an example of a TSV file with a binary response variable:
3737
- `import_table` - Import data from a TSV file into a Spark Data Frame (sdf).
3838

3939
```python
40-
from fsspark.utils.io import import_table
41-
sdf = import_table('data.tsv.bgz',
42-
sep='\t',
43-
n_partitions=5)
40+
from fslite.utils.io import import_table
41+
42+
sdf = import_table('data.tsv.bgz',
43+
sep='\t',
44+
n_partitions=5)
4445
```
4546

4647
- `import_table_as_psdf` - Import data from a TSV file into a Spark Data Frame (sdf) and
4748
convert it into a Pandas on Spark Data Frame (psdf).
4849

4950
```python
50-
from fsspark.utils.io import import_table_as_psdf
51-
psdf = import_table_as_psdf('data.tsv.bgz',
52-
sep='\t',
51+
from fslite.utils.io import import_table_as_psdf
52+
53+
psdf = import_table_as_psdf('data.tsv.bgz',
54+
sep='\t',
5355
n_partitions=5)
5456
```
5557

@@ -73,9 +75,9 @@ contains the response variable.
7375
#### How to create a Feature Selection Spark Data Frame (FSDF)
7476

7577
```python
76-
from fsspark.config.context import init_spark, stop_spark_session
77-
from fsspark.fs.core import FSDataFrame
78-
from fsspark.utils.io import import_table_as_psdf
78+
from fslite.config.context import init_spark, stop_spark_session
79+
from fslite.fs.core import FSDataFrame
80+
from fslite.utils.io import import_table_as_psdf
7981

8082
# Init spark
8183
init_spark()

docs/README.methods.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,4 +53,4 @@ A typical workflow written using `fsspark` can be divided roughly in four major
5353

5454
### 5. Feature selection pipeline example
5555

56-
[FS pipeline example](../fsspark/pipeline/fs_pipeline_example.py)
56+
[FS pipeline example](../fslite/pipeline/fs_pipeline_example.py)

environment.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
name: fsspark-venv
1+
name: fslite-venv
22
channels:
33
- defaults
44
- conda-forge
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.

fsspark/fs/methods.py renamed to fslite/fs/methods.py

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
11
from abc import ABC, abstractmethod
22
from typing import List, Type, Union, Tuple, Optional, Dict, Any
33

4-
from fsspark.fs.constants import (ML_METHODS, UNIVARIATE_METHODS,
5-
MULTIVARIATE_METHODS)
6-
from fsspark.fs.core import FSDataFrame
7-
from fsspark.fs.ml import MLCVModel
8-
from fsspark.fs.multivariate import multivariate_filter
9-
from fsspark.fs.univariate import univariate_filter
4+
from fslite.fs.constants import (ML_METHODS, UNIVARIATE_METHODS,
5+
MULTIVARIATE_METHODS)
6+
from fslite.fs.core import FSDataFrame
7+
from fslite.fs.ml import MLCVModel
8+
from fslite.fs.multivariate import multivariate_filter
9+
from fslite.fs.univariate import univariate_filter
1010

1111

1212
class FSMethod(ABC):

fsspark/fs/ml.py renamed to fslite/fs/ml.py

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -20,15 +20,15 @@
2020
from pyspark.ml.regression import RandomForestRegressionModel, RandomForestRegressor
2121
from pyspark.ml.tuning import CrossValidator, ParamGridBuilder, CrossValidatorModel, Param
2222

23-
from fsspark.fs.constants import (RF_BINARY,
24-
LSVC_BINARY,
25-
FM_BINARY,
26-
RF_MULTILABEL,
27-
LR_MULTILABEL,
28-
RF_REGRESSION,
29-
FM_REGRESSION,
30-
ML_METHODS)
31-
from fsspark.fs.core import FSDataFrame
23+
from fslite.fs.constants import (RF_BINARY,
24+
LSVC_BINARY,
25+
FM_BINARY,
26+
RF_MULTILABEL,
27+
LR_MULTILABEL,
28+
RF_REGRESSION,
29+
FM_REGRESSION,
30+
ML_METHODS)
31+
from fslite.fs.core import FSDataFrame
3232

3333
ESTIMATORS_CLASSES = [RandomForestClassifier, RandomForestRegressionModel, LinearSVC, LogisticRegression]
3434
EVALUATORS_CLASSES = [BinaryClassificationEvaluator, MulticlassClassificationEvaluator, RegressionEvaluator]

fsspark/fs/multivariate.py renamed to fslite/fs/multivariate.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,11 +6,11 @@
66
from pyspark.ml.feature import (VarianceThresholdSelector)
77
from pyspark.ml.stat import Correlation
88

9-
from fsspark.fs.constants import MULTIVARIATE_METHODS, MULTIVARIATE_CORRELATION, MULTIVARIATE_VARIANCE
9+
from fslite.fs.constants import MULTIVARIATE_METHODS, MULTIVARIATE_CORRELATION, MULTIVARIATE_VARIANCE
1010

11-
from fsspark.fs.core import FSDataFrame
12-
from fsspark.fs.utils import find_maximal_independent_set
13-
from fsspark.utils.generic import tag
11+
from fslite.fs.core import FSDataFrame
12+
from fslite.fs.utils import find_maximal_independent_set
13+
from fslite.utils.generic import tag
1414

1515
logging.basicConfig(format="%(levelname)s (%(name)s %(lineno)s): %(message)s")
1616
logger = logging.getLogger("FSSPARK:MULTIVARIATE")

0 commit comments

Comments
 (0)