Permalink
Cannot retrieve contributors at this time
Name already in use
A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
ipd_extended/constants.py
Go to fileThis commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
114 lines (91 sloc)
3.76 KB
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import socket
from enum import Enum
class CorrelationMeasure(Enum):
    """Identifiers of the correlation measures that can be selected.

    The member names ``ID`` and ``FID`` are also used by ``DistanceMeasure``,
    but with different numeric values, so members of the two enums must not
    be compared through ``.value``.
    """

    UDS = 1
    CMI = 2
    MAC = 3
    ID = 4
    FID = 5
class DistanceMeasure(Enum):
    """Identifiers of the distance measures that can be selected.

    ``ID`` and ``FID`` share their names with members of
    ``CorrelationMeasure`` but carry different numeric values here.
    """

    ID = 1
    CJS = 2
    FID = 3
class InteractionType(Enum):
    """Identifiers of the interaction types used when iterating over datasets.

    ``INTERACTION_TYPE_RANGE_LIST`` in this module selects which of these
    members are actually iterated.
    """

    CUBES = 1
    XORCUBES = 2
    BLOBS = 3
    XORBLOBS = 4
    UNIFORM = 5
# NOTE(review): the ID_ prefix presumably refers to the "ID" measure of the
# enums in this module - confirm against the call sites.
ID_THRESHOLD_QUANTILE = 0.3
ID_SLIDING_WINDOW = 40
NORMALIZATION_RADIUS = 1

FILE_DATA_OUTPUT = "out.arff"
FILE_DATA_CUTS = 'cut.txt'
# Regex whose single capture group is the text after the last '/' of the
# matched string (the whole string when it contains no '/').
FILE_NAME_PATTERN = '(?:.*/)*(.*)$'

# subspace mining parameters
MAX_SUBSPACE_SIZE = 5
DEFAULT_SM_K_RANGE = [2, 4, 8]
HETEROGENEOUS_THRESHOLD = 0.8
BEAM_WIDTH = 4

# cjs
CLUMP = 2
MAXMAX = 5
SUBSPACE_SET_STEP = 2
# class Environment(Enum):
#     TEST = 1
#     PRODUCTION = 2
#
# ENVIRONMENT = Environment.TEST
TRIVIAL_BINS_COUNT_LIST = [None, 5]

# old settings
# The host named 'push' gets the large configuration; every other host gets
# the small one.
TOTAL_IRRELEVANT_FEATURES = 100 if socket.gethostname() == 'push' else 3
#
# RELEVANT_FEATURES_UPPER_BOUND=3 if socket.gethostname() != 'push' else 31
# RELEVANT_FEATURES_LOWER_BOUND=2
#
# INTERACTIONS_UPPER_BOUND=4 if socket.gethostname() != 'push' else 11
# INTERACTIONS_LOWER_BOUND=3 if socket.gethostname() != 'push' else 1

# new settings (more constrained)
# main execution
# The order of the values is kept exactly as originally written (it is not
# sorted); both variants end with TOTAL_IRRELEVANT_FEATURES.
IRRELEVANT_FEATURES_RANGE_LIST = (
    [1, 2, 3, 4, 8, 16, 32, 64, 99, 6, 12, 24, 48, TOTAL_IRRELEVANT_FEATURES]
    if socket.gethostname() == 'push'
    else [1, 2, TOTAL_IRRELEVANT_FEATURES]
)
FOOTPRINTS_NUMBER_RANGE_LIST = [4, 8]
# datasets iterator (executes either real datasets or artificial datasets, depends on value of REAL_DATASETS)
# None selects the artificial datasets; DATA_DIR in this module switches on
# the same value.
REAL_DATASETS = None
# REAL_DATASETS=['gas', 'gas_small', 'gas_r128', 'gas_small_r128']
INTERACTION_TYPE_RANGE_LIST = [
    InteractionType.CUBES,
    InteractionType.XORCUBES,
    InteractionType.BLOBS,
    InteractionType.XORBLOBS,
    # InteractionType.UNIFORM
]
# Ranges iterated for the artificial datasets. The host named 'push' gets the
# wider ranges; any other host gets a single small value per range.
XOR_OFFSETS = [0, 1]
XOR_RELEVANT_FEATURES_RANGE_LIST = [3, 4, 5, 6] if socket.gethostname() == 'push' else [3]
CUBES_RELEVANT_FEATURES_RANGE_LIST = [4, 8] if socket.gethostname() == 'push' else [4]
INTERACTION_NUMBER_RANGE_LIST = [1, 2]
CUBES_NUMBER_RANGE_LIST = [1, 2]
ROWS_RANGE_LIST = [1000, 5000, 10000] if socket.gethostname() == 'push' else [1000]
# # datasets iterator (1 dataset)
# INTERACTION_TYPE_RANGE_LIST = [InteractionType.CUBES
#                                # InteractionType.UNIFORM
#                                ]
# XOR_OFFSETS = [0, 1]
# XOR_RELEVANT_FEATURES_RANGE_LIST = [3, 4, 5, 6] if socket.gethostname() == 'push' else [3]
# CUBES_RELEVANT_FEATURES_RANGE_LIST = [4, 8] if socket.gethostname() == 'push' else [4]
# INTERACTION_NUMBER_RANGE_LIST = [1]
# CUBES_NUMBER_RANGE_LIST = [1]
# ROWS_RANGE_LIST = [1000, 5000, 10000, 20000] if socket.gethostname() == 'push' else [1000]
# todo delete later
NAIVE_CHUNK_SIZE_RANGE_LIST = [2, 4, 10, 20] if socket.gethostname() == 'push' else [2]

# Root directory that the data and result paths in this module are built on;
# it differs between the host named 'push' and any other machine.
BASE = (
    '/local/tmp/ipd_extended_experiments2/'
    if socket.gethostname() == 'push'
    else '/Users/tatyanadembelova/Documents/study/thesis/ipd_extended/'
)
# Locations below BASE. DATA_DIR points at 'new_cubes/' while REAL_DATASETS
# is None and at 'data/' otherwise.
DATA_DIR = BASE + ('new_cubes/' if REAL_DATASETS is None else "data/")
PERFECT_DISCRETIZATIONS_DIR = BASE + 'ideal_disc/'
PERFECT_SUBSPACES_JSON = BASE + 'ideal_subspaces.json'

# The "code-fic/" checkout sits directly under BASE on the host named 'push'
# and under the thesis directory on any other host.
SLIM_BASE = (
    "/Users/tatyanadembelova/Documents/study/thesis/"
    if socket.gethostname() != 'push'
    else BASE
) + "code-fic/"
SLIM_DATA_DIR = SLIM_BASE + "data/"
SLIM_BIN = SLIM_BASE + "branches/slim/trunk/fic"
SLIM_COMPRESS_CONF = SLIM_BASE + "branches/slim/trunk/compress.conf"
SLIM_CONVERT_CONF = SLIM_BASE + "branches/slim/trunk/convertdb.conf"
# File names of the CSV reports.
PRECISION_RECALL_FILENAME = "Precision_recall_runtime.csv"
COMPRESSION_FILENAME = "Compression.csv"
DETAILS_FILENAME = "Details.csv"

# Path to the Weka jar; differs between the host named 'push' and any other
# machine.
WEKA_BIN = (
    "/local/tmp/ipd_extended_experiments2/weka/weka-3-9-1/weka.jar"
    if socket.gethostname() == 'push'
    else "/Users/tatyanadembelova/Downloads/weka-3-9-1/weka.jar"
)