8
8
This module creates tags.
9
9
10
10
"""
11
- import redis
12
-
13
11
import time
14
- import datetime
15
12
16
13
from pubsublogger import publisher
17
14
from Helper import Process
18
- from packages import Paste
19
- from packages import Item
20
-
21
-
22
- def get_item_date (item_filename ):
23
- l_directory = item_filename .split ('/' )
24
- return '{}{}{}' .format (l_directory [- 4 ], l_directory [- 3 ], l_directory [- 2 ])
25
-
26
- def set_tag_metadata (tag , date ):
27
- # First time we see this tag ## TODO: filter paste from the paste ?
28
- if not server .hexists ('tag_metadata:{}' .format (tag ), 'first_seen' ):
29
- server .hset ('tag_metadata:{}' .format (tag ), 'first_seen' , date )
30
- # Check and Set tag last_seen
31
- last_seen = server .hget ('tag_metadata:{}' .format (tag ), 'last_seen' )
32
- if last_seen is None or date > last_seen :
33
- server .hset ('tag_metadata:{}' .format (tag ), 'last_seen' , date )
15
+ from packages import Tag
34
16
35
17
if __name__ == '__main__' :
36
18
@@ -45,18 +27,6 @@ def set_tag_metadata(tag, date):
45
27
# Setup the I/O queues
46
28
p = Process (config_section )
47
29
48
- server = redis .StrictRedis (
49
- host = p .config .get ("ARDB_Tags" , "host" ),
50
- port = p .config .get ("ARDB_Tags" , "port" ),
51
- db = p .config .get ("ARDB_Tags" , "db" ),
52
- decode_responses = True )
53
-
54
- server_metadata = redis .StrictRedis (
55
- host = p .config .get ("ARDB_Metadata" , "host" ),
56
- port = p .config .get ("ARDB_Metadata" , "port" ),
57
- db = p .config .get ("ARDB_Metadata" , "db" ),
58
- decode_responses = True )
59
-
60
30
# Send a description of the module to the logger
61
31
publisher .info ("Tags module started" )
62
32
@@ -71,27 +41,8 @@ def set_tag_metadata(tag, date):
71
41
continue
72
42
73
43
else :
74
- tag , path = message .split (';' )
75
- # add the tag to the tags word_list
76
- res = server .sadd ('list_tags' , tag )
77
- if res == 1 :
78
- print ("new tags added : {}" .format (tag ))
79
- # add the path to the tag set
80
- #curr_date = datetime.date.today().strftime("%Y%m%d")
81
- item_date = get_item_date (path )
82
- res = server .sadd ('{}:{}' .format (tag , item_date ), path )
83
- if res == 1 :
84
- print ("new paste: {}" .format (path ))
85
- print (" tagged: {}" .format (tag ))
86
- set_tag_metadata (tag , item_date )
87
- server_metadata .sadd ('tag:{}' .format (path ), tag )
88
-
89
- # Domain Object
90
- if Item .is_crawled (path ) and tag != 'infoleak:submission="crawler"' :
91
- domain = Item .get_item_domain (path )
92
- server_metadata .sadd ('tag:{}' .format (domain ), tag )
93
- server .sadd ('domain:{}:{}' .format (tag , item_date ), domain )
44
+ print (message )
45
+ tag , item_id = message .split (';' )
94
46
95
- curr_date = datetime .date .today ().strftime ("%Y%m%d" )
96
- server .hincrby ('daily_tags:{}' .format (item_date ), tag , 1 )
47
+ Tag .add_tag ("item" , tag , item_id )
97
48
p .populate_set_out (message , 'MISP_The_Hive_feeder' )
0 commit comments