⚡️ Build request with stream specific fields #12

All LDP stream shares standards fields This commit remove those from the stream mapping and build a request asking only for the stream specific fields.
2022-10-11 01:11:31 +02:00 · 2022-10-11 01:11:31 +02:00 · 949520d260
parent 6ed57de1aa
commit 949520d260
2 changed files with 59 additions and 49 deletions
--- a/ldpy.py
+++ b/ldpy.py
@ -113,33 +113,38 @@ def parse_args(args=sys.argv[1:]):
    return parser.parse_args(args)


-def get_last_entries(entries_nb):
+def request_last_entries(entries_nb, fields=[]):
    """Get the last n entries from a stream."""
    if entries_nb not in LAST_E_CHOICES:
        logger.critical("'%s' is not in '%s'", entries_nb, LAST_E_CHOICES)
        raise ValueError

-    logger.debug("Wait before getting '%s' entries!", entries_nb)
-    query = {"size": entries_nb}
-    last_entries = client.opnsrch_clt.search(body=query)
+    logger.debug("Requesting last '%s' entries…", entries_nb)
+    last_entries = client.opnsrch_clt.search(
+        body={"size": entries_nb, "_source": fields}
+    )
+
    logger.debug(pf(last_entries))

    return last_entries["hits"]["hits"]


-def get_map_props():
+def request_map_props():
    """Get stream mapping.

    LDP indices are rolling and LDP do not implement the call
    to get indices related to an alias.
    """
+    logger.debug("Requesting mapping for '%s' stream…", client.LDP_STREAM_NAME)
+
    try:
        indices = list(client.opnsrch_clt.indices.get_alias("*"))
        mapping = client.opnsrch_clt.indices.get_mapping(client.LDP_ALIAS)[indices[0]][
            "mappings"
        ]
        map_props = sorted(list(mapping["properties"]))
-        logger.debug("Mapping found for alias: '%s'", client.LDP_ALIAS)
+        logger.debug("Mapping received for alias: '%s'", client.LDP_ALIAS)
+        logger.debug(map_props)

    except AuthorizationException:
        map_props = None
@ -148,33 +153,31 @@ def get_map_props():
    return map_props


-def strip_std_field(initial_entries):
+def strip_std_field(fields):
    """Remove standard LDP fields to ease human reading.

-    Returns a list populated with a dict for each entry.
+    Returns a list populated with a list of stream specific fields.
    """
-    stripped_entries = []
-    for initial_hit in initial_entries:
+    for field in STD_FIELDS:
+        fields.remove(field)

-        for key in STD_FIELDS:
-            del initial_hit["_source"][key]
-
-        stripped_entries.append(initial_hit["_source"])
-
-    return stripped_entries
+    return fields


 def main(options):
    """Execute as script. Functions related to the arguments passed."""
    if options.mapping:
-        response = get_map_props()
-        logger.debug("Mapping for '%s' stream: %s", client.LDP_STREAM_NAME, response)
+        response = request_map_props()
+
    elif options.last:
-        response = strip_std_field(get_last_entries(options.last))
+        response = request_last_entries(
+            options.last, strip_std_field(request_map_props())
+        )
        logger.debug(
            "Last '%s' entries for '%s' stream:", options.last, client.LDP_STREAM_NAME
        )
        logger.debug(response)
+
    else:
        raise NotImplementedError

--- a/tests_ldpy.py
+++ b/tests_ldpy.py
@ -19,6 +19,7 @@ from ldpy import LAST_E_CHOICES, STD_FIELDS
 LAST_E_MIN = LAST_E_CHOICES[0] - 1
 LAST_E_MAX = len(LAST_E_CHOICES) + 1
 META_FIELDS = ["_id", "_source", "_shards", "hits"]
+DEMO_STREAM_FIELDS = ["rating_num", "message", "title", "id", "category"]


 # Faking options from argparse
@ -89,51 +90,57 @@ def test_parse_args_last_const():
 # ###
@mark.parametrize("fields", [META_FIELDS, STD_FIELDS])
 def test_strip_std_field(fields):
-    """Remove keys/values present in all LDP stream."""
+    """Remove fields present in all LDP stream."""
    payload = [
-        {
-            "_id": "-",
-            "_source": {
-                "category": "-",
-                "gl2_source_input": "",
-                "gl2_source_node": "-",
-                "id": "-",
-                "message": "-",
-                "rating_num": 42,
-                "source": "-",
-                "streams": [""],
-                "timestamp": "2022-10-04 20:59:22.364402",
-                "title": "-",
-                "X-OVH-CONTENT-SIZE": 42,
-                "X-OVH-DELIVERY-DATE": "2022-10-04T20:59:22.578894878Z",
-                "X-OVH-INPUT": "",
-            },
-        },
+        "category",
+        "gl2_source_input",
+        "gl2_source_node",
+        "id",
+        "message",
+        "rating_num",
+        "source",
+        "streams",
+        "timestamp",
+        "title",
+        "X-OVH-CONTENT-SIZE",
+        "X-OVH-DELIVERY-DATE",
+        "X-OVH-INPUT",
    ]
-    stripped_entry = ldpy.strip_std_field(payload)[0]
+    stripped_entry = ldpy.strip_std_field(payload)

-    assert isinstance(stripped_entry, dict)
+    assert isinstance(stripped_entry, list)

    for field in fields:
        assert field not in stripped_entry


 # ###
-# Testing get_last_entries()
+# Testing request_last_entries()
 # ###
-@mark.parametrize("entry_np", [LAST_E_MIN, LAST_E_MAX])
-def test_get_last_entries_out_of_range(entry_np):
+@mark.parametrize("opt_last", [LAST_E_MIN, LAST_E_MAX])
+def test_request_last_entries_out_of_range(opt_last):
    """Value is out of range for the last entries."""
    with raises(ValueError):
-        ldpy.get_last_entries(entry_np)
+        ldpy.request_last_entries(opt_last)


@pytest.mark.vcr()
-@mark.parametrize("entry_np", LAST_E_CHOICES)
-def test_get_last_entries_in_range(entry_np):
+@mark.parametrize(
+    "opt_last, fields",
+    [
+        (LAST_E_CHOICES[0], DEMO_STREAM_FIELDS),
+        (len(LAST_E_CHOICES), DEMO_STREAM_FIELDS),
+    ],
+)
+def test_request_last_entries_in_range(opt_last, fields):
    """Value is in range for the last entries."""
-    response = ldpy.get_last_entries(entry_np)
-    assert len(response) == entry_np
+    response_id = opt_last - 1
+    response = ldpy.request_last_entries(opt_last, fields)
+
+    assert len(response) == opt_last
+    for field in STD_FIELDS:
+        assert field not in response[0]["_source"]
+        assert field not in response[response_id]["_source"]


 # ###
@ -151,7 +158,7 @@ def test_main_without_option():
 def test_main_demo_with_mapping():
    """Called with mapping option.

-    `main()` just tranfers `get_map_props()` return: this test is not really useful
+    `main()` just transfers `request_map_props()` return: this test is not really useful
    """
    options = FakeOptions(["mapping"])
    response = ldpy.main(options)