ipython
diff --git a/‎.github/workflows/test.yml‎
Lines changed: 21 additions & 1 deletion b/‎.github/workflows/test.yml‎
Lines changed: 21 additions & 1 deletion
diff --git a/‎docs/make.bat‎
Lines changed: 2 additions & 2 deletions b/‎docs/make.bat‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/source/examples/basic_task_label.py‎
Lines changed: 39 additions & 10 deletions b/‎docs/source/examples/basic_task_label.py‎
Lines changed: 39 additions & 10 deletions
diff --git a/‎docs/source/reference/db.md‎
Lines changed: 17 additions & 10 deletions b/‎docs/source/reference/db.md‎
Lines changed: 17 additions & 10 deletions
diff --git a/‎ipyparallel/client/client.py‎
Lines changed: 6 additions & 1 deletion b/‎ipyparallel/client/client.py‎
Lines changed: 6 additions & 1 deletion
diff --git a/‎ipyparallel/client/view.py‎
Lines changed: 24 additions & 8 deletions b/‎ipyparallel/client/view.py‎
Lines changed: 24 additions & 8 deletions
diff --git a/‎ipyparallel/controller/dictdb.py‎
Lines changed: 2 additions & 0 deletions b/‎ipyparallel/controller/dictdb.py‎
Lines changed: 2 additions & 0 deletions
@@ -84,11 +84,14 @@ jobs:
 
       - name: Set up slurm
         if: ${{ matrix.cluster_type == 'slurm' }}
+        # docker build can lead to a race condition -> image "docker.io/library/ipp-cluster:slurm": already exists
+        # see https://github.com/mlflow/mlflow/pull/20779
+        # workaround: run docker compose again if the first call failed
         run: |
           export DOCKER_BUILDKIT=1
           export COMPOSE_DOCKER_CLI_BUILD=1
           cd ci/slurm
-          docker compose up -d --build
+          docker compose up -d --build || docker compose up -d --build
 
       - name: Install Python (conda) ${{ matrix.python }}
         if: ${{ matrix.cluster_type == 'mpi' }}
@@ -128,6 +131,23 @@ jobs:
           pip install distributed joblib
           pip install --only-binary :all: matplotlib
 
+      - name: Start MongoDB
+        if: ${{ (! matrix.runs_on) && (! matrix.cluster_type) }} # only under linux with no cluster
+        uses: supercharge/mongodb-github-action@1.12.1 # uses the latest MongoDB version by default
+
+      - name: Install pymongo package
+        if: ${{ (! matrix.runs_on) && (! matrix.cluster_type) }} # only under linux with no cluster
+        run: pip install pymongo
+
+      - name: Try to connect to mongodb
+        if: ${{ (! matrix.runs_on) && (! matrix.cluster_type) }} # only under linux with no cluster
+        run: |
+          python3 <<EOF
+          from pymongo import MongoClient
+          client = MongoClient('mongodb://localhost:27017/',serverSelectionTimeoutMS=1)
+          print(client.server_info())
+          EOF
+
       - name: Show environment
         run: pip freeze
 
 
@@ -4,8 +4,8 @@ pushd %~dp0
 
 REM Command file for Sphinx documentation
 
-if "%SPHINXBUILD%" == "" (
-	set SPHINXBUILD=--color -W --keep-going
+if "%SPHINXOPTS%" == "" (
+	set SPHINXOPTS=--color -W --keep-going
 )
 if "%SPHINXBUILD%" == "" (
 	set SPHINXBUILD=sphinx-build
 
@@ -1,4 +1,12 @@
-"""Basic task label example"""
+"""Basic task label example
+
+Labels can be used for identifying or semantically grouping tasks. Using the $glob operator,
+relevant task records can be queried from the Task Database.
+
+Authors
+-------
+* ottointhesky
+"""
 
 import ipyparallel as ipp
 
@@ -18,13 +26,17 @@ def wait(t):
     return time.time() - tic
 
 
+count = 5  # number of tasks per method
+
 # use load balanced view
 bview = rc.load_balanced_view()
 ar_list_b1 = [
-    bview.set_flags(label=f"mylabel_map_{i:02}").map_async(wait, [2]) for i in range(10)
+    bview.set_flags(label=f"bview_map_{i:02}").map_async(wait, [2])
+    for i in range(count)
 ]
 ar_list_b2 = [
-    bview.set_flags(label=f"mylabel_map_{i:02}").apply_async(wait, 2) for i in range(10)
+    bview.set_flags(label=f"bview_apply_{i:02}").apply_async(wait, 2)
+    for i in range(count)
 ]
 bview.wait(ar_list_b1)
 bview.wait(ar_list_b2)
@@ -33,19 +45,36 @@ def wait(t):
 # use direct view
 dview = rc[:]
 ar_list_d1 = [
-    dview.set_flags(label=f"mylabel_map_{i + 10:02}").apply_async(wait, 2)
-    for i in range(10)
+    dview.set_flags(label=f"dview_map_{i + 10:02}").map_async(wait, [2])
+    for i in range(count)
 ]
 ar_list_d2 = [
-    dview.set_flags(label=f"mylabel_map_{i + 10:02}").map_async(wait, [2])
-    for i in range(10)
+    dview.set_flags(label=f"dview_apply_{i + 10:02}").apply_async(wait, 2)
+    for i in range(count)
 ]
 dview.wait(ar_list_d1)
 dview.wait(ar_list_d2)
 
+
+def print_records(titel, data):
+    print(f"{titel} ({len(data)} records)")
+    for d in data:
+        print(
+            f"\tmsg_id={d['msg_id']}; label={d['label']}; engine_uuid={d['engine_uuid']}"
+        )
+
+
+query_keys = ['msg_id', 'label', 'engine_uuid']
+
 # query database
-data = rc.db_query({'label': {"$nin": ""}}, keys=['msg_id', 'label', 'engine_uuid'])
-for d in data:
-    print(f"msg_id={d['msg_id']}; label={d['label']}; engine_uuid={d['engine_uuid']}")
+data = rc.db_query({'label': {"$nin": ""}}, keys=query_keys)
+print_records("all entries with labels", data)
+
+data = rc.db_query({'label': {"$glob": "dview_*"}}, keys=query_keys)
+print_records("all dview label entries", data)
+
+data = rc.db_query({'label': {"$glob": "*_map_*"}}, keys=query_keys)
+print_records("all map label entries", data)
 
+# stop cluster
 cluster.stop_cluster_sync()
@@ -75,19 +75,26 @@ TaskRecord keys:
 | error          | dict        | Python traceback (error message content)                    |
 | stdout         | str         | Stream of stdout data                                       |
 | stderr         | str         | Stream of stderr data                                       |
+| label          | str         | Optional user-defined task identifier                       |
 
 MongoDB operators we emulate on all backends:
 
-| Operator | Python equivalent |
-| -------- | ----------------- |
-| '\$in'   | in                |
-| '\$nin'  | not in            |
-| '\$eq'   | ==                |
-| '\$ne'   | !=                |
-| '\$gt'   | >                 |
-| '\$gte'  | >=                |
-| '\$le'   | \<                |
-| '\$lte'  | \<=               |
+| Operator | Python equivalent                                                             |
+| -------- | ----------------------------------------------------------------------------- |
+| '\$in'   | in                                                                            |
+| '\$nin'  | not in                                                                        |
+| '\$eq'   | ==                                                                            |
+| '\$ne'   | !=                                                                            |
+| '\$gt'   | >                                                                             |
+| '\$gte'  | >=                                                                            |
+| '\$lt'   | \<                                                                            |
+| '\$lte'  | \<=                                                                           |
+| '\$glob' | [fnmatch](https://docs.python.org/3/library/fnmatch.html) (wildcard matching) |
+
+Remarks on _$glob_: The operator can be used to find substrings in DB columns based on
+[Unix-style filename pattern matching](https://docs.python.org/3/library/fnmatch.html).
+_$glob_ is **not** a regular MongoDB operator, but is internally translated to a regular
+expression (_$regex_) which is natively supported by MongoDB.
 
 The DB Query is useful for two primary cases:
 
 
@@ -1226,7 +1226,9 @@ def relay_comm(msg):
             for callback in msg_future.iopub_callbacks:
                 callback(msg)
 
-    def create_message_futures(self, msg_id, header, async_result=False, track=False):
+    def create_message_futures(
+        self, msg_id, header, async_result=False, track=False, label=None
+    ):
         msg_future = MessageFuture(msg_id, header=header, track=track)
         futures = [msg_future]
         self._futures[msg_id] = msg_future
@@ -1237,6 +1239,7 @@ def create_message_futures(self, msg_id, header, async_result=False, track=False
             # hook up metadata
             output.metadata = self.metadata[msg_id]
             output.metadata['submitted'] = util.utcnow()
+            output.metadata['label'] = label
             msg_future.output = output
             futures.append(output)
         return futures
@@ -1266,6 +1269,7 @@ def _send(
         msg_id = msg['header']['msg_id']
 
         expect_reply = msg_type not in {"comm_msg", "comm_close", "comm_open"}
+        label = metadata["label"] if metadata and "label" in metadata else None
 
         if expect_reply and track_outstanding:
             # add to outstanding, history
@@ -1289,6 +1293,7 @@ def _send(
                 msg['header'],
                 async_result=msg_type in {'execute_request', 'apply_request'},
                 track=track,
+                label=label,
             )
             if message_future_hook is not None:
                 message_future_hook(futures[0])
 
@@ -138,7 +138,7 @@ def __len__(self):
     def set_flags(self, **kwargs):
         """set my attribute flags by keyword.
 
-        Views determine behavior with a few attributes (`block`, `track`, etc.).
+        Views determine behavior with a few attributes (`block`, `track`, `label`, etc.).
         These attributes can be set all at once by name with this method.
 
         Parameters
@@ -149,6 +149,8 @@ def set_flags(self, **kwargs):
             whether to create a MessageTracker to allow the user to
             safely edit after arrays and buffers during non-copying
             sends.
+        label : str
+            set an optional user-defined task identifier
         """
         for name, value in kwargs.items():
             if name not in self._flag_names:
@@ -557,6 +559,8 @@ def _really_apply(
             whether to block
         track : bool [default: self.track]
             whether to ask zmq to track the message, for safe non-copying sends
+        label : str [default self.label]
+            set an optional user-defined task identifier
 
         Returns
         -------
@@ -642,6 +646,8 @@ def map(
             Only for zero-copy sends such as numpy arrays that are going to be modified in-place.
         return_exceptions : bool [default False]
             Return remote Exceptions in the result sequence instead of raising them.
+        label : str [default self.label]
+            set an optional user-defined task identifier
 
         Returns
         -------
@@ -672,7 +678,7 @@ def map(
 
     @sync_results
     @save_ids
-    def execute(self, code, silent=True, targets=None, block=None):
+    def execute(self, code, silent=True, targets=None, block=None, label=None):
         """Executes `code` on `targets` in blocking or nonblocking manner.
 
         ``execute`` is always `bound` (affects engine namespace)
@@ -681,18 +687,21 @@ def execute(self, code, silent=True, targets=None, block=None):
         ----------
         code : str
             the code string to be executed
-        block : bool
+        block : bool [default self.block]
             whether or not to wait until done to return
-            default: self.block
+        label : str [default self.label]
+            set an optional user-defined task identifier
         """
         block = self.block if block is None else block
         targets = self.targets if targets is None else targets
+        label = self.label if label is None else label
+        metadata = dict(label=label)
 
         _idents, _targets = self.client._build_targets(targets)
         futures = []
         for ident in _idents:
             future = self.client.send_execute_request(
-                self._socket, code, silent=silent, ident=ident
+                self._socket, code, silent=silent, ident=ident, metadata=metadata
             )
             futures.append(future)
         if isinstance(targets, int):
@@ -708,7 +717,7 @@ def execute(self, code, silent=True, targets=None, block=None):
                 pass
         return ar
 
-    def run(self, filename, targets=None, block=None):
+    def run(self, filename, targets=None, block=None, label=None):
         """Execute contents of `filename` on my engine(s).
 
         This simply reads the contents of the file and calls `execute`.
@@ -723,13 +732,15 @@ def run(self, filename, targets=None, block=None):
         block : bool
             whether or not to wait until done
             default: self.block
+        label : str
+            set an optional user-defined task identifier
 
         """
         with open(filename) as f:
             # add newline in case of trailing indented whitespace
             # which will cause SyntaxError
             code = f.read() + '\n'
-        return self.execute(code, block=block, targets=targets)
+        return self.execute(code, block=block, targets=targets, label=label)
 
     def update(self, ns):
         """update remote namespace with dict `ns`
@@ -1076,7 +1087,6 @@ def map(
         block=None,
         track=False,
         return_exceptions=False,
-        label=None,
     ):
         """Parallel version of builtin `map`, using this View's `targets`.
 
@@ -1297,6 +1307,8 @@ def set_flags(self, **kwargs):
             DependencyTimeout.
         retries : int
             Number of times a task will be retried on failure.
+        label : str
+            set an optional user-defined task identifier
         """
 
         super().set_flags(**kwargs)
@@ -1348,6 +1360,8 @@ def _really_apply(
             whether to block
         track : bool [default: self.track]
             whether to ask zmq to track the message, for safe non-copying sends
+        label : str [default self.label]
+            set an optional user-defined task identifier
         !!!!!! TODO : THE REST HERE  !!!!
 
         Returns
@@ -1470,6 +1484,8 @@ def map(
 
         return_exceptions: bool [default False]
             Return Exceptions instead of raising on the first exception.
+        label : str [default self.label]
+            set an optional user-defined task identifier
 
         Returns
         -------
 
@@ -36,6 +36,7 @@
 # Copyright (c) IPython Development Team.
 # Distributed under the terms of the Modified BSD License.
 import copy
+import fnmatch
 from copy import deepcopy
 from datetime import datetime
 
@@ -59,6 +60,7 @@
     '$all': lambda a, b: all([a in bb for bb in b]),
     '$mod': lambda a, b: a % b[0] == b[1],
     '$exists': lambda a, b: (b and a is not None) or (a is None and not b),
+    '$glob': lambda a, b: fnmatch.fnmatch(a, b) if a is not None else False,
 }
Original file line number	Diff line number	Diff line change
`@@ -4,8 +4,8 @@ pushd %~dp0`
`4`	`4`
`5`	`5`	`REM Command file for Sphinx documentation`
`6`	`6`
`7`		`-if "%SPHINXBUILD%" == "" (`
`8`		`- set SPHINXBUILD=--color -W --keep-going`
	`7`	`+if "%SPHINXOPTS%" == "" (`
	`8`	`+ set SPHINXOPTS=--color -W --keep-going`
`9`	`9`	`)`
`10`	`10`	`if "%SPHINXBUILD%" == "" (`
`11`	`11`	`set SPHINXBUILD=sphinx-build`