Changing sensitive hashtags to communal hashtags

Question

Changing sensitive hashtags to communal hashtags

Closed this issue 5 years ago · 4 comments

Database tables affected by the change from sensitive to communal hashtags:

token_communal_count1   
token_communal_count_perday 
token_communal_hourwise

location

location_token_communal1
location_token_communal1_hourwise
location_token_communal1_perday

The changes need to be made in the public dashboard, trend analysis, and location monitor.

4nuragk commented 5 years ago

Done

Answer 1 · 2020-06-01T21:44:27.000Z

#48 is solved in the public dashboard.

Answer 2 · 2020-06-01T21:46:56.000Z

The same change needs to be done in the location monitor and trend analysis.

Answer 3 · 2020-06-14T15:28:43.000Z

Schema:

-- processed_keyspace.token_communal_count1
--   Partition key     : created_date
--   Clustering columns: class, created_time, communal_class, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- presumably `count` is the number of tweets and `tweetid_list` their ids — TODO confirm with the writer job.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.token_communal_count1 (
    created_date   date,
    class          int,
    created_time   text,
    communal_class int,
    token_name     text,
    count          bigint,
    tweetid_list   list<text>,
    PRIMARY KEY (
        (created_date),
        class, created_time, communal_class, token_name
    )
)
WITH CLUSTERING ORDER BY (
        class DESC,
        created_time DESC,
        communal_class DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;
-- processed_keyspace.token_communal_count_perday
--   Partition key     : created_date
--   Clustering columns: class, communal_class, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- presumably holds one aggregate row per token per day — TODO confirm with the writer job.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.token_communal_count_perday (
    created_date   date,
    class          int,
    communal_class int,
    token_name     text,
    count          bigint,
    tweetid_list   list<text>,
    PRIMARY KEY (
        (created_date),
        class, communal_class, token_name
    )
)
WITH CLUSTERING ORDER BY (
        class DESC,
        communal_class DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;
-- processed_keyspace.token_communal_hourwise
--   Partition key     : created_date
--   Clustering columns: class, created_time, communal_class, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- NOTE(review): columns and key are identical to token_communal_count1; presumably
-- created_time holds an hour bucket here — TODO confirm with the writer job.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.token_communal_hourwise (
    created_date   date,
    class          int,
    created_time   text,
    communal_class int,
    token_name     text,
    count          bigint,
    tweetid_list   list<text>,
    PRIMARY KEY (
        (created_date),
        class, created_time, communal_class, token_name
    )
)
WITH CLUSTERING ORDER BY (
        class DESC,
        created_time DESC,
        communal_class DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;
-- processed_keyspace.location_token_communal1
--   Partition key     : created_date
--   Clustering columns: created_time, class, communal_class, country, state, city,
--                       tweet_cl_latitude, tweet_cl_longitude, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- presumably `count` is the number of tweets for the token at that location — TODO confirm.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.location_token_communal1 (
    created_date       date,
    created_time       text,
    class              int,
    communal_class     int,
    country            text,
    state              text,
    city               text,
    tweet_cl_latitude  double,
    tweet_cl_longitude double,
    token_name         text,
    count              bigint,
    tweetid_list       list<text>,
    PRIMARY KEY (
        (created_date),
        created_time, class, communal_class,
        country, state, city,
        tweet_cl_latitude, tweet_cl_longitude,
        token_name
    )
)
WITH CLUSTERING ORDER BY (
        created_time DESC,
        class DESC,
        communal_class DESC,
        country DESC,
        state DESC,
        city DESC,
        tweet_cl_latitude DESC,
        tweet_cl_longitude DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;
-- processed_keyspace.location_token_communal1_hourwise
--   Partition key     : created_date
--   Clustering columns: created_time, class, communal_class, country, state, city,
--                       tweet_cl_latitude, tweet_cl_longitude, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- presumably created_time holds an hour bucket here — TODO confirm with the writer job.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.location_token_communal1_hourwise (
    created_date       date,
    created_time       text,
    class              int,
    communal_class     int,
    country            text,
    state              text,
    city               text,
    tweet_cl_latitude  double,
    tweet_cl_longitude double,
    token_name         text,
    count              bigint,
    tweetid_list       list<text>,
    PRIMARY KEY (
        (created_date),
        created_time, class, communal_class,
        country, state, city,
        tweet_cl_latitude, tweet_cl_longitude,
        token_name
    )
)
WITH CLUSTERING ORDER BY (
        created_time DESC,
        class DESC,
        communal_class DESC,
        country DESC,
        state DESC,
        city DESC,
        tweet_cl_latitude DESC,
        tweet_cl_longitude DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;
-- processed_keyspace.location_token_communal1_perday
--   Partition key     : created_date
--   Clustering columns: class, communal_class, country, state, city,
--                       tweet_cl_latitude, tweet_cl_longitude, token_name (all DESC)
--   Regular columns   : count, tweetid_list
-- presumably holds one aggregate row per token and location per day — TODO confirm.
-- NOTE(review): read_repair_chance / dclocal_read_repair_chance are, to my knowledge,
-- no longer supported from Cassandra 4.0 — confirm against the target cluster version.
CREATE TABLE processed_keyspace.location_token_communal1_perday (
    created_date       date,
    class              int,
    communal_class     int,
    country            text,
    state              text,
    city               text,
    tweet_cl_latitude  double,
    tweet_cl_longitude double,
    token_name         text,
    count              bigint,
    tweetid_list       list<text>,
    PRIMARY KEY (
        (created_date),
        class, communal_class,
        country, state, city,
        tweet_cl_latitude, tweet_cl_longitude,
        token_name
    )
)
WITH CLUSTERING ORDER BY (
        class DESC,
        communal_class DESC,
        country DESC,
        state DESC,
        city DESC,
        tweet_cl_latitude DESC,
        tweet_cl_longitude DESC,
        token_name DESC
    )
    AND comment = ''
    AND compaction = {'class': 'org.apache.cassandra.db.compaction.SizeTieredCompactionStrategy', 'max_threshold': '32', 'min_threshold': '4'}
    AND compression = {'chunk_length_in_kb': '64', 'class': 'org.apache.cassandra.io.compress.LZ4Compressor'}
    AND caching = {'keys': 'ALL', 'rows_per_partition': 'NONE'}
    AND bloom_filter_fp_chance = 0.01
    AND crc_check_chance = 1.0
    AND min_index_interval = 128
    AND max_index_interval = 2048
    AND read_repair_chance = 0.0
    AND dclocal_read_repair_chance = 0.1
    AND speculative_retry = '99PERCENTILE'
    AND default_time_to_live = 0
    AND gc_grace_seconds = 864000
    AND memtable_flush_period_in_ms = 0;