| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | from django.db.models.signals import post_save, pre_delete | 
					
						
							|  |  |  | from django.db.models import Q | 
					
						
							|  |  |  | import peeringdb_server.rest | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  | from peeringdb_server.models import ( | 
					
						
							|  |  |  |     UTC, | 
					
						
							|  |  |  |     InternetExchange, | 
					
						
							|  |  |  |     Network, | 
					
						
							|  |  |  |     Facility, | 
					
						
							|  |  |  |     Organization, | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | import re | 
					
						
							|  |  |  | import time | 
					
						
							|  |  |  | import datetime | 
					
						
							| 
									
										
										
										
											2019-05-02 15:20:20 +00:00
										 |  |  | import unidecode | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-05-02 15:20:20 +00:00
										 |  |  | def unaccent(v): | 
					
						
							|  |  |  |     return unidecode.unidecode(v).lower() | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | # SEARCH INDEX BE STORED HERE | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | SEARCH_CACHE = {"search_index": {}, "time": 0} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | # We want to hook searchable objects into save and delete signals | 
					
						
							|  |  |  | # so we can update the search index as the data changes without having | 
					
						
							|  |  |  | # to reload the entire thing all the time | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def hook_save(sender, **kwargs): | 
					
						
							|  |  |  |     obj = kwargs.get("instance") | 
					
						
							|  |  |  |     tag = obj._handleref.tag | 
					
						
							|  |  |  |     idx = SEARCH_CACHE.get("search_index") | 
					
						
							|  |  |  |     if obj.status == "ok": | 
					
						
							|  |  |  |         if tag not in idx: | 
					
						
							|  |  |  |             idx[tag] = {} | 
					
						
							|  |  |  |         idx.get(tag)[obj.id] = obj | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |     #        print "%d %s refreshed in search index" % (obj.id, tag) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |     else: | 
					
						
							|  |  |  |         try: | 
					
						
							|  |  |  |             del idx[tag][obj.id] | 
					
						
							|  |  |  |         except KeyError: | 
					
						
							|  |  |  |             pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #        print "%d %s delete from search index" % (obj.id, tag) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def hook_delete(sender, **kwargs): | 
					
						
							|  |  |  |     obj = kwargs.get("instance") | 
					
						
							|  |  |  |     tag = obj._handleref.tag | 
					
						
							|  |  |  |     try: | 
					
						
							|  |  |  |         del SEARCH_CACHE.get["search_index"][tag][obj.id] | 
					
						
							|  |  |  |     except TypeError: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  |     except KeyError: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #    print "%d %s deleted from search index " % (obj.id, tag) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  | searchable_models = [InternetExchange, Network, Facility, Organization] | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | for model in searchable_models: | 
					
						
							|  |  |  |     post_save.connect(hook_save, sender=model) | 
					
						
							|  |  |  |     pre_delete.connect(hook_delete, sender=model) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def search(term): | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Search searchable objects (ixp, network, facility ...) by term | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Returns result dict | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |     search_tags = ("fac", "ix", "net", "org") | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |     ref_dict = peeringdb_server.rest.ref_dict() | 
					
						
							|  |  |  |     t = time.time() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if not SEARCH_CACHE.get("search_index"): | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # whole db takes 5ish seconds, too slow to cache inline here | 
					
						
							|  |  |  |         search_index = { | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |             tag: {obj.id: obj for obj in model.objects.filter(status__in=["ok"])} | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |             for tag, model in list(ref_dict.items()) | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |             if tag in search_tags | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |         for typ, stor in list(search_index.items()): | 
					
						
							|  |  |  |             print("CACHED: %d items in %s" % (len(stor), typ)) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |         tag_id_re = re.compile(r"(" + r"|".join(search_tags) + r"|asn|as)(\d+)") | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         # FIXME: for now lets force a flush every 120 seconds, might want to look | 
					
						
							|  |  |  |         # at an event based update solution instead | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |         SEARCH_CACHE.update( | 
					
						
							|  |  |  |             search_index=search_index, time=t, update_t=t, tag_id_re=tag_id_re | 
					
						
							|  |  |  |         ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |     else: | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |         search_index = SEARCH_CACHE.get("search_index") | 
					
						
							|  |  |  |         tag_id_re = SEARCH_CACHE.get("tag_id_re") | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # while we are using signals to make sure that the search index gets updated whenever | 
					
						
							|  |  |  |     # a model is saved, right now we still have updates from external sources | 
					
						
							|  |  |  |     # to which those signals cannot be easily connected (importer, fac_merge command etc.) | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # in order to reflect search index changes made by external sources | 
					
						
							|  |  |  |     # we need to find new / updated object regularily and update the | 
					
						
							|  |  |  |     # search index from that | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # FIXME: this can be taken out when we turn the importer off - or just leave it | 
					
						
							|  |  |  |     # in as a fail-safe as it is fairly unobtrusive | 
					
						
							|  |  |  |     ut = SEARCH_CACHE.get("update_t", 0) | 
					
						
							|  |  |  |     if t - ut > 600: | 
					
						
							|  |  |  |         dut = datetime.datetime.fromtimestamp(ut).replace(tzinfo=UTC()) | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |         print("Updating search index with newly created/updates objects") | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |         search_index_update = { | 
					
						
							|  |  |  |             tag: { | 
					
						
							|  |  |  |                 obj.id: obj | 
					
						
							|  |  |  |                 for obj in model.objects.filter( | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                     Q(created__gte=dut) | Q(updated__gte=dut) | 
					
						
							|  |  |  |                 ).filter(status="ok") | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |             } | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |             for tag, model in list(ref_dict.items()) | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |             if tag in search_tags | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |         for tag, objects in list(search_index_update.items()): | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |             if tag not in SEARCH_CACHE["search_index"]: | 
					
						
							|  |  |  |                 SEARCH_CACHE["search_index"][tag] = dict( | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                     [(obj.id, obj) for obj in ref_dict[tag].objects.filter(status="ok")] | 
					
						
							|  |  |  |                 ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |             SEARCH_CACHE["search_index"][tag].update(objects) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         SEARCH_CACHE["update_t"] = t | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # FIXME: for some reason this gets unset sometimes - need to figure out | 
					
						
							|  |  |  |     # why - for now just recreate when its missing | 
					
						
							|  |  |  |     if not tag_id_re: | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |         tag_id_re = re.compile(r"(" + r"|".join(search_tags) + r"|asn|as)(\d+)") | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |         SEARCH_CACHE["tag_id_re"] = tag_id_re | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |     print("Search index retrieval took %.5f seconds" % (time.time() - t)) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |     result = {tag: [] for tag, model in list(ref_dict.items())} | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-05-02 15:20:20 +00:00
										 |  |  |     term = unaccent(term) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # try to convert to int for numeric search matching | 
					
						
							|  |  |  |     typed_q = {} | 
					
						
							|  |  |  |     try: | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |         typed_q["int"] = int(term) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |     except ValueError: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # check for ref tags | 
					
						
							|  |  |  |     try: | 
					
						
							|  |  |  |         match = tag_id_re.match(term) | 
					
						
							|  |  |  |         if match: | 
					
						
							|  |  |  |             typed_q[match.group(1)] = match.group(2) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     except ValueError: | 
					
						
							|  |  |  |         pass | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # FIXME  model should have a search_fields attr on it | 
					
						
							|  |  |  |     # this whole thing should be replaced with something more modular to get | 
					
						
							|  |  |  |     # rid of all the ifs | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |     for tag, index in list(search_index.items()): | 
					
						
							|  |  |  |         for id, data in list(index.items()): | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             if tag == "org": | 
					
						
							|  |  |  |                 data.org_id = data.id | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-05-02 15:20:20 +00:00
										 |  |  |             if unaccent(data.name).find(term) > -1: | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                 result[tag].append( | 
					
						
							|  |  |  |                     {"id": id, "name": data.search_result_name, "org_id": data.org_id} | 
					
						
							|  |  |  |                 ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |                 continue | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |             if hasattr(data, "name_long") and unaccent(data.name_long).find(term) > -1: | 
					
						
							|  |  |  |                 result[tag].append( | 
					
						
							|  |  |  |                     {"id": id, "name": data.search_result_name, "org_id": data.org_id} | 
					
						
							|  |  |  |                 ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |                 continue | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |             if hasattr(data, "aka") and unaccent(data.aka).find(term) > -1: | 
					
						
							|  |  |  |                 result[tag].append( | 
					
						
							|  |  |  |                     {"id": id, "name": data.search_result_name, "org_id": data.org_id} | 
					
						
							|  |  |  |                 ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |                 continue | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             if typed_q: | 
					
						
							|  |  |  |                 if tag in typed_q: | 
					
						
							|  |  |  |                     if str(data.id).startswith(typed_q[tag]): | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                         result[tag].append( | 
					
						
							|  |  |  |                             { | 
					
						
							|  |  |  |                                 "id": id, | 
					
						
							|  |  |  |                                 "name": data.search_result_name, | 
					
						
							|  |  |  |                                 "org_id": data.org_id, | 
					
						
							|  |  |  |                             } | 
					
						
							|  |  |  |                         ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |                         continue | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                 # search asn on everyting? probably just if asn in search | 
					
						
							|  |  |  |                 # fields | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                 if hasattr(data, "asn"): | 
					
						
							|  |  |  |                     asn = typed_q.get( | 
					
						
							|  |  |  |                         "as", typed_q.get("asn", str(typed_q.get("int", ""))) | 
					
						
							|  |  |  |                     ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |                     if asn and str(data.asn).startswith(asn): | 
					
						
							| 
									
										
										
										
											2019-12-05 16:57:52 +00:00
										 |  |  |                         result[tag].append( | 
					
						
							|  |  |  |                             { | 
					
						
							|  |  |  |                                 "id": id, | 
					
						
							|  |  |  |                                 "name": data.search_result_name, | 
					
						
							|  |  |  |                                 "org_id": data.org_id, | 
					
						
							|  |  |  |                             } | 
					
						
							|  |  |  |                         ) | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-01-08 13:29:58 -06:00
										 |  |  |     for k, items in list(result.items()): | 
					
						
							| 
									
										
										
										
											2018-11-08 19:45:21 +00:00
										 |  |  |         result[k] = sorted(items, key=lambda row: row.get("name")) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return result |