File size: 2,010 Bytes
f006f31
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
# Language codes recognised by this module.
# "na" is not a real language: it is a placeholder for the language
# detection model (see the "lang_detect" entry of MODEL_NAMES).
AVAILABLE_LANGUAGES = [
    "en",
    "es",
    "na",
]

# Fallback label/score pair.
# NOTE(review): presumably used when no prediction is available -- confirm
# against the callers, which are not visible from this file.
DEFAULT_LABEL = "No data"

DEFAULT_SCORE = 0.0

# Values stored under each entry's "classification" key.
# NOTE(review): these look like Hugging Face pipeline task names -- confirm
# with the code that consumes MODEL_NAMES.
_TEXT_TASK = "text-classification"
_TOKEN_TASK = "token-classification"

# Model lookup table: prediction target -> {"classification": task,
# <language code>: model identifier}.
# Most targets use one model for both "en" and "es"; "room_features" and
# "room_view" have a separate model per language.
MODEL_NAMES = {
    "bed_type": {
        "classification": _TEXT_TASK,
        "en": "travelgate/bed_type_model-classifier",
        "es": "travelgate/bed_type_model-classifier",
    },
    "room_category": {
        "classification": _TEXT_TASK,
        "en": "travelgate/room_category-classifier",
        "es": "travelgate/room_category-classifier",
    },
    "environment": {
        "classification": _TEXT_TASK,
        "en": "travelgate/room_environment-classifier",
        "es": "travelgate/room_environment-classifier",
    },
    "room_features": {
        "classification": _TOKEN_TASK,
        "en": "travelgate/feature_predicted_en",
        "es": "travelgate/feature_predicted_es",
    },
    "room_type": {
        "classification": _TEXT_TASK,
        "en": "travelgate/room_type-classifier",
        "es": "travelgate/room_type-classifier",
    },
    "room_view": {
        "classification": _TOKEN_TASK,
        "en": "travelgate/view_predicted_en",
        "es": "travelgate/view_predicted_es",
    },
    "lang_detect": {
        "classification": _TEXT_TASK,
        # "na" is a placeholder language code for the single detection model.
        "na": "papluca/xlm-roberta-base-language-detection",
    },
}

# Spanish hotel/room vocabulary, written without accents or "ñ"
# (e.g. "habitacion", "bano"). Some entries are multi-word phrases.
# NOTE(review): presumably matched against normalised text as a language
# hint -- confirm with the caller.
SPANISH_KEYWORDS = [
    "habitacion", "cama", "bano", "aire acondicionado", "television",
    "desayuno", "vista", "servicio", "caja fuerte", "ducha",
    "sabanas", "toallas", "limpieza", "recepcion", "piscina",
    "gimnasio", "ascensor", "estacionamiento", "secador de pelo", "armario",
    "escritorio", "telefono", "decoracion", "silla", "mesa",
    "luz", "ventana", "apartamento", "casa", "vistas",
    "presidencial", "estandar", "estudio", "terraza", "doble",
]

# English room/property vocabulary, kept as a set (unordered, unique members).
# NOTE(review): presumably the English counterpart of the Spanish keyword
# list used for language hints -- confirm with the caller.
ENGLISH_KEYWORDS = {
    "apartment",
    "room",
    "house",
    "views",
    "presidential",
    "studio",
    "suite",
    "standard",
    "deluxe",
}