|
| 1 | +from rest_framework.views import APIView |
| 2 | +from rest_framework.response import Response |
| 3 | +from django.core.cache import cache |
| 4 | +from bims.models.dataset import Dataset |
| 5 | +from bims.models.biological_collection_record import BiologicalCollectionRecord |
| 6 | +from bims.serializers.dataset_serializer import DatasetSerializer |
| 7 | + |
| 8 | + |
# Cache entry that stores the distinct GBIF dataset keys, and the number of
# seconds that entry is kept before it has to be rebuilt.
GBIF_DATASET_KEYS_CACHE_KEY = 'gbif_dataset_keys'
GBIF_DATASET_KEYS_CACHE_TIMEOUT = 24 * 60 * 60  # 24 hours, in seconds
| 12 | + |
| 13 | + |
def clear_dataset_cache():
    """Drop the cached list of GBIF dataset keys.

    Intended to be called once new GBIF data has been imported, so that
    stale keys are not served from the cache.
    """
    cache_key = GBIF_DATASET_KEYS_CACHE_KEY
    cache.delete(cache_key)
| 20 | + |
| 21 | + |
class DatasetAutocompleteAPIView(APIView):
    """
    Autocomplete API for GBIF datasets.

    Only datasets whose ``uuid`` matches the ``dataset_key`` of at least one
    BiologicalCollectionRecord with ``source_collection='gbif'`` are
    returned.

    Query params:
    - q: search term for dataset name (at least 2 characters after
      surrounding whitespace is trimmed)
    - ids: comma-separated database IDs for bootstrapping; when present it
      takes precedence over ``q``
    """

    # Minimum length of ``q`` before a search is attempted.
    MIN_QUERY_LENGTH = 2
    # Upper bound on the number of suggestions returned in search mode.
    MAX_RESULTS = 10

    @staticmethod
    def _parse_ids(ids_param):
        """Turn a comma-separated string into a list of integer IDs.

        Empty tokens (e.g. from a trailing comma) are skipped.

        Raises:
            ValueError: if any non-empty token is not a valid integer.
        """
        tokens = (token.strip() for token in ids_param.split(','))
        return [int(token) for token in tokens if token]

    @staticmethod
    def _gbif_dataset_keys():
        """Return the distinct, non-empty dataset keys of GBIF records.

        The list is read from the cache when available; otherwise it is
        computed from the database and cached for
        GBIF_DATASET_KEYS_CACHE_TIMEOUT seconds.
        """
        dataset_keys = cache.get(GBIF_DATASET_KEYS_CACHE_KEY)
        # An empty list is a valid cached value, so only ``None`` (a cache
        # miss) triggers the database query.
        if dataset_keys is not None:
            return dataset_keys

        raw_keys = BiologicalCollectionRecord.objects.filter(
            source_collection='gbif'
        ).exclude(
            dataset_key__isnull=True
        ).values_list('dataset_key', flat=True).distinct()

        # De-duplicate in Python as well and drop falsy values such as
        # empty strings, which the NULL exclusion above does not catch.
        dataset_keys = list({key for key in raw_keys if key})
        cache.set(
            GBIF_DATASET_KEYS_CACHE_KEY,
            dataset_keys,
            GBIF_DATASET_KEYS_CACHE_TIMEOUT,
        )
        return dataset_keys

    def get(self, request, format=None):
        """Return serialized datasets for a bootstrap or search request.

        Returns:
            - HTTP 400 with an ``error`` message when ``ids`` contains a
              non-integer value.
            - An empty list when ``ids`` is absent and ``q`` is shorter
              than MIN_QUERY_LENGTH.
            - Otherwise the serialized matching datasets; search mode
              returns at most MAX_RESULTS entries ordered by name.
        """
        query = request.query_params.get('q', '').strip()
        ids_param = request.query_params.get('ids', '')

        # Validate the request before touching the cache or the database.
        ids_list = None
        if ids_param:
            try:
                ids_list = self._parse_ids(ids_param)
            except ValueError:
                return Response(
                    {'error': "'ids' must be a comma-separated list of "
                              "integers."},
                    status=400,
                )
        elif len(query) < self.MIN_QUERY_LENGTH:
            return Response([])

        # Base queryset: only datasets with GBIF records
        base_qs = Dataset.objects.filter(
            uuid__in=self._gbif_dataset_keys()
        )

        if ids_list is not None:
            # Bootstrap mode: fetch by database IDs
            datasets = base_qs.filter(id__in=ids_list)
        else:
            # Search mode: filter by name. Order explicitly so that the
            # slice below yields the same suggestions on every request.
            datasets = base_qs.filter(
                name__icontains=query
            ).distinct().order_by('name')[:self.MAX_RESULTS]

        serializer = DatasetSerializer(datasets, many=True)
        return Response(serializer.data)
0 commit comments