Skip to content
Permalink
b1a05852fb
Switch branches/tags

Name already in use

A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
Go to file
 
 
Cannot retrieve contributors at this time
114 lines (91 sloc) 3.76 KB
from enum import Enum
import socket
class CorrelationMeasure(Enum):
    """Identifiers for the available correlation measures.

    The abbreviations are not expanded anywhere in this module; see the code
    that consumes the enum for their meaning.
    """

    UDS = 1
    CMI = 2
    MAC = 3
    ID = 4
    FID = 5
class DistanceMeasure(Enum):
    """Identifiers for the available distance measures.

    The abbreviations are not expanded anywhere in this module; see the code
    that consumes the enum for their meaning.
    """

    ID = 1
    CJS = 2
    FID = 3
class InteractionType(Enum):
    """Identifiers for the interaction types a dataset can be built from.

    NOTE(review): presumably these name the shapes of generated artificial
    data -- confirm against the data generator.
    """

    CUBES = 1
    XORCUBES = 2
    BLOBS = 3
    XORBLOBS = 4
    UNIFORM = 5
# Numeric tuning values; their exact semantics live in the consuming code.
ID_THRESHOLD_QUANTILE = 0.3
ID_SLIDING_WINDOW = 40
NORMALIZATION_RADIUS = 1

# Default file names for the produced data and cut files.
FILE_DATA_OUTPUT = 'out.arff'
FILE_DATA_CUTS = 'cut.txt'

# Regex that skips any leading "dir/" components and captures the remainder
# of the path in group 1.
FILE_NAME_PATTERN = r'(?:.*/)*(.*)$'
# --- subspace mining parameters ---
MAX_SUBSPACE_SIZE = 5
DEFAULT_SM_K_RANGE = [2, 4, 8]
HETEROGENEOUS_THRESHOLD = 0.8
BEAM_WIDTH = 4

# --- cjs parameters ---
CLUMP = 2
MAXMAX = 5
SUBSPACE_SET_STEP = 2
# class Environment(Enum):
# TEST = 1
# PRODUCTION = 2
#
# ENVIRONMENT = Environment.TEST
# NOTE(review): the None entry presumably means "no fixed bin count" --
# confirm against the code that consumes this list.
TRIVIAL_BINS_COUNT_LIST = [None, 5]

# old settings (kept for reference)
#
# RELEVANT_FEATURES_UPPER_BOUND=3 if socket.gethostname() != 'push' else 31
# RELEVANT_FEATURES_LOWER_BOUND=2
#
# INTERACTIONS_UPPER_BOUND=4 if socket.gethostname() != 'push' else 11
# INTERACTIONS_LOWER_BOUND=3 if socket.gethostname() != 'push' else 1

# new settings (more constrained)
# main execution
# The host named 'push' gets the full grid; every other host gets a short one.
# In both cases the grid ends with TOTAL_IRRELEVANT_FEATURES itself.
if socket.gethostname() == 'push':
    TOTAL_IRRELEVANT_FEATURES = 100
    IRRELEVANT_FEATURES_RANGE_LIST = [
        1, 2, 3, 4, 8, 16, 32, 64, 99, 6, 12, 24, 48,
        TOTAL_IRRELEVANT_FEATURES,
    ]
else:
    TOTAL_IRRELEVANT_FEATURES = 3
    IRRELEVANT_FEATURES_RANGE_LIST = [1, 2, TOTAL_IRRELEVANT_FEATURES]

FOOTPRINTS_NUMBER_RANGE_LIST = [4, 8]
# datasets iterator: runs either the real datasets or the artificial ones,
# depending on the value of REAL_DATASETS
REAL_DATASETS = None
# REAL_DATASETS=['gas', 'gas_small', 'gas_r128', 'gas_small_r128']

# Interaction types covered by the iterator; UNIFORM is currently disabled.
INTERACTION_TYPE_RANGE_LIST = [
    InteractionType.CUBES,
    InteractionType.XORCUBES,
    InteractionType.BLOBS,
    InteractionType.XORBLOBS,
    # InteractionType.UNIFORM
]
# Grids that are the same on every host.
XOR_OFFSETS = [0, 1]
INTERACTION_NUMBER_RANGE_LIST = [1, 2]
CUBES_NUMBER_RANGE_LIST = [1, 2]

# Grids that are wider on the host named 'push' and minimal elsewhere.
if socket.gethostname() == 'push':
    XOR_RELEVANT_FEATURES_RANGE_LIST = [3, 4, 5, 6]
    CUBES_RELEVANT_FEATURES_RANGE_LIST = [4, 8]
    ROWS_RANGE_LIST = [1000, 5000, 10000]
else:
    XOR_RELEVANT_FEATURES_RANGE_LIST = [3]
    CUBES_RELEVANT_FEATURES_RANGE_LIST = [4]
    ROWS_RANGE_LIST = [1000]
# # datasets iterator (1 dataset)
# INTERACTION_TYPE_RANGE_LIST = [InteractionType.CUBES
# # InteractionType.UNIFORM
# ]
# XOR_OFFSETS = [0, 1]
# XOR_RELEVANT_FEATURES_RANGE_LIST = [3, 4, 5, 6] if socket.gethostname() == 'push' else [3]
# CUBES_RELEVANT_FEATURES_RANGE_LIST = [4, 8] if socket.gethostname() == 'push' else [4]
# INTERACTION_NUMBER_RANGE_LIST = [1]
# CUBES_NUMBER_RANGE_LIST = [1]
# ROWS_RANGE_LIST = [1000, 5000, 10000, 20000] if socket.gethostname() == 'push' else [1000]
# TODO: delete later
# Chunk sizes: full list on the host named 'push', a single value elsewhere.
if socket.gethostname() == 'push':
    NAIVE_CHUNK_SIZE_RANGE_LIST = [2, 4, 10, 20]
else:
    NAIVE_CHUNK_SIZE_RANGE_LIST = [2]
# Root directories depend on the machine: the host named 'push' keeps
# everything (including the code-fic checkout) under one experiment
# directory, any other host uses the hard-coded local thesis directory.
if socket.gethostname() == 'push':
    BASE = '/local/tmp/ipd_extended_experiments2/'
    SLIM_BASE = BASE + "code-fic/"
else:
    BASE = '/Users/tatyanadembelova/Documents/study/thesis/ipd_extended/'
    SLIM_BASE = "/Users/tatyanadembelova/Documents/study/thesis/" + "code-fic/"

# With no real datasets configured the data directory is 'new_cubes/',
# otherwise it is 'data/'.
if REAL_DATASETS is None:
    DATA_DIR = BASE + 'new_cubes/'
else:
    DATA_DIR = BASE + "data/"
PERFECT_DISCRETIZATIONS_DIR = BASE + 'ideal_disc/'
PERFECT_SUBSPACES_JSON = BASE + 'ideal_subspaces.json'

# Locations inside the code-fic tree.
SLIM_DATA_DIR = SLIM_BASE + "data/"
_SLIM_TRUNK = SLIM_BASE + "branches/slim/trunk/"
SLIM_BIN = _SLIM_TRUNK + "fic"
SLIM_COMPRESS_CONF = _SLIM_TRUNK + "compress.conf"
SLIM_CONVERT_CONF = _SLIM_TRUNK + "convertdb.conf"
# Names of the result files.
PRECISION_RECALL_FILENAME = "Precision_recall_runtime.csv"
COMPRESSION_FILENAME = "Compression.csv"
DETAILS_FILENAME = "Details.csv"

# Location of the Weka jar: under the experiment directory on the host
# named 'push', in the local Downloads folder on any other host.
if socket.gethostname() == 'push':
    WEKA_BIN = "/local/tmp/ipd_extended_experiments2/weka/weka-3-9-1/weka.jar"
else:
    WEKA_BIN = "/Users/tatyanadembelova/Downloads/weka-3-9-1/weka.jar"