Commit e13e345

Add support for a CPU-only Mode (nv-morpheus#1851)
* Adds a new enum `morpheus.config.ExecutionMode` with members `GPU` & `CPU`, along with a new `morpheus.config.Config.execution_mode` attribute.
* For backwards compatibility, `Config.execution_mode` defaults to `GPU`.
* Add new `supported_execution_modes` to `StageBase` which returns `ExecutionMode.GPU` by default. This ensures that building a pipeline with a stage not matching the execution mode will raise a reasonable error to the user.
* Add `CpuOnlyMixin` and `GpuAndCpuMixin` mixins to automate overriding this, making it easier for users to determine at a glance which execution modes a given stage supports.
* Since C++ stage/message impls can only support cuDF DataFrames and RMM tensors, this PR re-purposes the existing Python stage/message impls to serve as the CPU-only mode.
* CPU-only mode centers around pandas DataFrames and NumPy arrays for tensors, since the current Python code which expects cuDF/CuPy is already 99% compatible with pandas/NumPy.
* Avoid importing `cudf` or any other GPU-based package (which will fail on import) at the top level of a module. This is important for stages, messages and modules which are automatically imported by the morpheus CLI tool.
* Add new utility methods to `morpheus.utils.type_utils` (ex: `get_df_pkg`, `is_cudf_type`) to help avoid importing cudf directly.
* Add a new `Config.freeze` method which makes a config object immutable. This is called the first time a config object is used to construct a pipeline or stage object, preventing config parameters from being changed in the middle of pipeline construction.
* `CudfHelper::load` is no longer called automatically on import; instead it is called manually on pipeline build when the execution mode is GPU.
* Add a Python implementation of `ControlMessage`.
* To simulate a system without a GPU when testing CPU-only mode, if the `CPU_ONLY` environment variable is defined, `docker/run_container_dev.sh` will launch the container using the `runc` runtime.
* Remove automatic test parameterization over C++/Python mode, since supporting CPU-only mode will become the exception not the rule. Add a new `gpu_and_cpu_mode` test marker to explicitly indicate a test intended to be parameterized over execution modes.
* Fix the copy constructor for `ControlMessage`.
* `AppShieldSourceStage` now emits `ControlMessage`s; `AppShieldMessageMeta` is now deprecated.
* `AutoencoderSourceStage`, and thus `AzureSourceStage`, `CloudTrailSourceStage`, and `DuoSourceStage`, now emit `ControlMessage`; `UserMessageMeta` is now deprecated.
* DFP production pipeline updated to remove `DFPMessageMeta`; the pipeline now executes in C++ mode.
* Consolidate common logic in `docker/run_container_dev.sh` & `docker/run_container_release.sh` into `docker/run_container.sh`.
* Remove inconsistent behavior in the Python impl of `TensorMemory.set_tensor` (nv-morpheus#1955)

Closes nv-morpheus#1646
Closes nv-morpheus#1846
Closes nv-morpheus#1852
Closes nv-morpheus#1955

## By Submitting this PR I confirm:
- I am familiar with the [Contributing Guidelines](https://github.com/nv-morpheus/Morpheus/blob/main/docs/source/developer_guide/contributing.md).
- When the PR is ready for review, new or existing tests cover these changes.
- When the PR is ready for review, the documentation is up to date with these changes.

Authors:
- David Gardner (https://github.com/dagardner-nv)
- Yuchen Zhang (https://github.com/yczhang-nv)

Approvers:
- Michael Demoret (https://github.com/mdemoret-nv)

URL: nv-morpheus#1851
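The lazy-import approach behind `get_df_pkg` can be sketched as follows. This is an illustrative mock, not the actual `morpheus.utils.type_utils` implementation; only the names `ExecutionMode`, `GPU`, `CPU`, and `get_df_pkg` come from the PR description above:

```python
from enum import Enum
from types import ModuleType


class ExecutionMode(Enum):
    GPU = "GPU"
    CPU = "CPU"


def get_df_pkg(mode: ExecutionMode) -> ModuleType:
    """Return the DataFrame package for the given execution mode.

    cudf is imported lazily, inside the function, so that CPU-only
    systems never attempt (and fail) the import at module load time.
    """
    if mode == ExecutionMode.GPU:
        import cudf  # deferred: only runs when a GPU pipeline is built
        return cudf

    import pandas
    return pandas


pkg = get_df_pkg(ExecutionMode.CPU)
print(pkg.__name__)  # pandas
```

On a CPU-only host, `get_df_pkg(ExecutionMode.CPU)` returns `pandas` without ever touching `cudf`, which is the property the CLI auto-import requirement above depends on.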
1 parent 5692639 commit e13e345

File tree: 266 files changed, +3257 -3145 lines changed


ci/vale/styles/config/vocabularies/morpheus/accept.txt (+5)

```diff
@@ -18,6 +18,9 @@ CMake
 Conda
 CPython
 [Cc]ryptocurrenc[y|ies]
+cuDF
+cuML
+CuPy
 [Cc]yber
 [Cc]ybersecurity
 Cython
@@ -51,7 +54,9 @@ NeMo
 nginx
 NIC
 NIM(s?)
+NumPy
 NVIDIA
+pandas
 [Pp]arallelization
 [Pp]arsable
 PCIe
```
docker/run_container.sh (new file, +57)

```diff
@@ -0,0 +1,57 @@
+#!/bin/bash
+# SPDX-FileCopyrightText: Copyright (c) 2021-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# Color variables
+b="\033[0;36m"
+g="\033[0;32m"
+r="\033[0;31m"
+e="\033[0;90m"
+y="\033[0;33m"
+x="\033[0m"
+
+_UNDEF_VAR_ERROR_MSG="Use the dev/release scripts to set these automatically"
+
+DOCKER_IMAGE_NAME=${DOCKER_IMAGE_NAME:?"Must set \$DOCKER_IMAGE_NAME. ${_UNDEF_VAR_ERROR_MSG}"}
+DOCKER_IMAGE_TAG=${DOCKER_IMAGE_TAG:?"Must set \$DOCKER_IMAGE_TAG. ${_UNDEF_VAR_ERROR_MSG}"}
+
+# DOCKER_ARGS are set by the dev/release scripts
+# DOCKER_EXTRA_ARGS are optionally set by the user
+DOCKER_ARGS=${DOCKER_ARGS:-""}
+DOCKER_ARGS="${DOCKER_ARGS} --net=host --cap-add=sys_nice ${DOCKER_EXTRA_ARGS}"
+DOCKER_EXTRA_ARGS=${DOCKER_EXTRA_ARGS:-""}
+
+if [[ -n "${CPU_ONLY}" ]]; then
+    echo -e "${b}Executing in CPU only mode${x}"
+    DOCKER_ARGS="${DOCKER_ARGS} --runtime=runc"
+else
+    echo -e "${b}Executing in GPU mode${x}"
+    DOCKER_ARGS="${DOCKER_ARGS} --runtime=nvidia --gpus=all"
+fi
+
+if [[ -n "${SSH_AUTH_SOCK}" ]]; then
+    echo -e "${b}Setting up ssh-agent auth socket${x}"
+    DOCKER_ARGS="${DOCKER_ARGS} -v $(readlink -f $SSH_AUTH_SOCK):/ssh-agent:ro -e SSH_AUTH_SOCK=/ssh-agent"
+fi
+
+echo -e "${g}Launching ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG}...${x}"
+
+# Enable command logging to show what is being executed
+set -x
+docker run ${DOCA_EXTRA_ARGS} --rm -ti ${DOCKER_ARGS} ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG} "${@:-bash}"
+
+{ EXIT_CODE=$?; set +x; } 2>/dev/null
+
+exit $EXIT_CODE
```

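The runtime-selection branch in `run_container.sh` above can be isolated into a small helper for illustration. The function name `select_runtime` is hypothetical, not part of the script; a non-empty first argument stands in for a defined `CPU_ONLY` environment variable:

```shell
#!/bin/bash
# select_runtime: emit the docker runtime flags for the given mode,
# mirroring the CPU_ONLY branch of run_container.sh.
select_runtime() {
    if [[ -n "$1" ]]; then
        # CPU_ONLY defined: default runc runtime, no GPUs requested
        echo "--runtime=runc"
    else
        # CPU_ONLY undefined: NVIDIA runtime with all GPUs
        echo "--runtime=nvidia --gpus=all"
    fi
}

select_runtime "1"   # prints --runtime=runc
select_runtime ""    # prints --runtime=nvidia --gpus=all
```

Launching with `--runtime=runc` on a GPU-capable host is what lets the dev container simulate a system without a GPU.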
docker/run_container_dev.sh (+6 -32)

```diff
@@ -14,38 +14,12 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-# set -x
+SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )"
 
-# Color variables
-b="\033[0;36m"
-g="\033[0;32m"
-r="\033[0;31m"
-e="\033[0;90m"
-y="\033[0;33m"
-x="\033[0m"
+export DOCKER_IMAGE_NAME=${DOCKER_IMAGE_NAME:-"morpheus"}
+export DOCKER_IMAGE_TAG=${DOCKER_IMAGE_TAG:-"dev-$(date +'%y%m%d')"}
 
-DOCKER_IMAGE_NAME=${DOCKER_IMAGE_NAME:-"morpheus"}
-DOCKER_IMAGE_TAG=${DOCKER_IMAGE_TAG:-"dev-$(date +'%y%m%d')"}
-DOCKER_EXTRA_ARGS=${DOCKER_EXTRA_ARGS:-""}
+export DOCKER_ARGS="-v $PWD:/workspace -v /dev/hugepages:/dev/hugepages --privileged"
 
-DOCKER_ARGS="--runtime=nvidia --env WORKSPACE_VOLUME=${PWD} -v $PWD:/workspace --net=host --gpus=all --cap-add=sys_nice"
-
-if [[ -n "${SSH_AUTH_SOCK}" ]]; then
-    echo -e "${b}Setting up ssh-agent auth socket${x}"
-    DOCKER_ARGS="${DOCKER_ARGS} -v $(readlink -f $SSH_AUTH_SOCK):/ssh-agent:ro -e SSH_AUTH_SOCK=/ssh-agent"
-fi
-
-echo -e "${g}Launching ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG}...${x}"
-
-set -x
-docker run \
-    -v /dev/hugepages:/dev/hugepages \
-    --privileged \
-    --rm \
-    -ti \
-    ${DOCKER_ARGS} ${DOCKER_EXTRA_ARGS} \
-    ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG} "${@:-bash}"
-
-{ EXIT_CODE=$?; set +x; } 2>/dev/null
-
-exit $EXIT_CODE
+# Call the general run script
+${SCRIPT_DIR}/run_container.sh
```

docker/run_container_release.sh (+7 -32)

```diff
@@ -16,48 +16,23 @@
 
 SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )"
 
-# Color variables
-b="\033[0;36m"
-g="\033[0;32m"
-r="\033[0;31m"
-e="\033[0;90m"
-y="\033[0;33m"
-x="\033[0m"
-
 # Change to the script file to ensure we are in the correct repo (in case were in a submodule)
 pushd ${SCRIPT_DIR} &> /dev/null
 
 MORPHEUS_SUPPORT_DOCA=${MORPHEUS_SUPPORT_DOCA:-OFF}
-MORPHEUS_BUILD_MORPHEUS_LLM=${MORPHEUS_BUILD_MORPHEUS_LLM:-ON}
-MORPHEUS_BUILD_MORPHEUS_DFP=${MORPHEUS_BUILD_MORPHEUS_DFP:-ON}
-
-DOCKER_IMAGE_NAME=${DOCKER_IMAGE_NAME:-"nvcr.io/nvidia/morpheus/morpheus"}
-DOCKER_IMAGE_TAG=${DOCKER_IMAGE_TAG:-"$(git describe --tags --abbrev=0)-runtime"}
 
-# This variable is used for passing extra arguments to the docker run command. Do not use DOCKER_ARGS for this purpose.
-DOCKER_EXTRA_ARGS=${DOCKER_EXTRA_ARGS:-""}
+export DOCKER_IMAGE_NAME=${DOCKER_IMAGE_NAME:-"nvcr.io/nvidia/morpheus/morpheus"}
+export DOCKER_IMAGE_TAG=${DOCKER_IMAGE_TAG:-"$(git describe --tags --abbrev=0)-runtime"}
 
 popd &> /dev/null
 
-DOCKER_ARGS="--runtime=nvidia --env WORKSPACE_VOLUME=${PWD} --net=host --gpus=all --cap-add=sys_nice ${DOCKER_EXTRA_ARGS}"
-
-if [[ -n "${SSH_AUTH_SOCK}" ]]; then
-    echo -e "${b}Setting up ssh-agent auth socket${x}"
-    DOCKER_ARGS="${DOCKER_ARGS} -v $(readlink -f $SSH_AUTH_SOCK):/ssh-agent:ro -e SSH_AUTH_SOCK=/ssh-agent"
-fi
-
-# DPDK requires hugepage and privileged container
-DOCA_EXTRA_ARGS=""
+# DPDK (and thus DOCA) requires hugepage and privileged container
+export DOCKER_ARGS=""
 if [[ ${MORPHEUS_SUPPORT_DOCA} == @(TRUE|ON) ]]; then
-    echo -e "${b}Enabling DOCA Support. Mounting /dev/hugepages and running in privileged mode${x}"
+    echo -e "Enabling DOCA Support. Mounting /dev/hugepages and running in privileged mode"
 
     DOCKER_ARGS="${DOCKER_ARGS} -v /dev/hugepages:/dev/hugepages --privileged"
 fi
 
-
-echo -e "${g}Launching ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG}...${x}"
-
-# Enable command logging to show what is being executed
-set -x
-docker run ${DOCA_EXTRA_ARGS} --rm -ti ${DOCKER_ARGS} ${DOCKER_IMAGE_NAME}:${DOCKER_IMAGE_TAG} "${@:-bash}"
-set +x
+# Call the general run script
+${SCRIPT_DIR}/run_container.sh
```

docs/source/conf.py (+1)

```diff
@@ -199,6 +199,7 @@
     r'^http://$',
     r'^https://$',
     r'https://(platform\.)?openai.com',
+    r'https://code.visualstudio.com'
 ]
 
 # Add any paths that contain templates here, relative to this directory.
```

docs/source/developer_guide/guides/2_real_world_phishing.md (+3 -2)

````diff
@@ -980,7 +980,7 @@ The code for our sink will be similar to other stages with a few changes. First,
 
 ```python
 @register_stage("to-rabbitmq")
-class WriteToRabbitMQStage(PassThruTypeMixin, SinglePortStage):
+class WriteToRabbitMQStage(PassThruTypeMixin, GpuAndCpuMixin, SinglePortStage):
 ```
 
 Our sink will function as a pass-through allowing the possibility of other sinks to be added to the pipeline. We could, hypothetically, have a pipeline where we emit the results to both RabbitMQ and a file. For this reason we will also be using the `PassThruTypeMixin`.
@@ -1032,14 +1032,15 @@ import pika
 from morpheus.cli.register_stage import register_stage
 from morpheus.config import Config
 from morpheus.messages.message_meta import MessageMeta
+from morpheus.pipeline.execution_mode_mixins import GpuAndCpuMixin
 from morpheus.pipeline.pass_thru_type_mixin import PassThruTypeMixin
 from morpheus.pipeline.single_port_stage import SinglePortStage
 
 logger = logging.getLogger(__name__)
 
 
 @register_stage("to-rabbitmq")
-class WriteToRabbitMQStage(PassThruTypeMixin, SinglePortStage):
+class WriteToRabbitMQStage(PassThruTypeMixin, GpuAndCpuMixin, SinglePortStage):
     """
     Source stage used to load messages from a RabbitMQ queue.
````

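The `GpuAndCpuMixin` added to `WriteToRabbitMQStage` above advertises which execution modes a stage supports. A minimal sketch of how such mixins could be structured follows; the real classes live in `morpheus.pipeline.execution_mode_mixins`, and the method bodies here are assumptions for illustration:

```python
from enum import Enum


class ExecutionMode(Enum):
    GPU = "GPU"
    CPU = "CPU"


class GpuAndCpuMixin:
    """Marks a stage as runnable in either execution mode."""

    def supported_execution_modes(self) -> tuple:
        return (ExecutionMode.GPU, ExecutionMode.CPU)


class CpuOnlyMixin:
    """Marks a stage as runnable only in CPU mode."""

    def supported_execution_modes(self) -> tuple:
        return (ExecutionMode.CPU,)
```

Declaring supported modes on the class lets pipeline construction reject a mismatched stage early with a clear error, rather than failing deep inside a cudf import.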
docs/source/developer_guide/guides/6_digital_fingerprinting_reference.md (+5 -5)

```diff
@@ -88,15 +88,15 @@ Defines a single column and type-cast.
 | Argument | Type | Description |
 | -------- | ---- | ----------- |
 | `name` | `str` | Name of the column |
-| `dtype` | `str` or Python type | Any type string or Python class recognized by [Pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
+| `dtype` | `str` or Python type | Any type string or Python class recognized by [pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
 
 #### Custom Column (`CustomColumn`)
 Subclass of `ColumnInfo`, defines a column to be computed by a user-defined function `process_column_fn`.
 
 | Argument | Type | Description |
 | -------- | ---- | ----------- |
 | `name` | `str` | Name of the column |
-| `dtype` | `str` or Python type | Any type string or Python class recognized by [Pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
+| `dtype` | `str` or Python type | Any type string or Python class recognized by [pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
 | `process_column_fn` | `function` | Function which receives the entire `DataFrame` as its only input, returning a new [`pandas.Series`](https://pandas.pydata.org/docs/reference/api/pandas.Series.html) object to be stored in column `name`. |
 | `input_column_types` | `dict[str, str]` | The input columns and the expected [`dtype` strings](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) that are needed for this Column to successfully process. Setting this as `None` will pass all columns. Specifying which columns are needed improves performance. |
@@ -139,7 +139,7 @@ Subclass of `RenameColumn`, specific to casting UTC localized `datetime` values.
 | Argument | Type | Description |
 | -------- | ---- | ----------- |
 | `name` | `str` | Name of the destination column |
-| `dtype` | `str` or Python type | Any type string or Python class recognized by [Pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
+| `dtype` | `str` or Python type | Any type string or Python class recognized by [pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
 | `input_name` | `str` | Original column name |
@@ -148,7 +148,7 @@ Subclass of `RenameColumn`, converts incoming `list` values to string by joining
 | Argument | Type | Description |
 | -------- | ---- | ----------- |
 | `name` | `str` | Name of the destination column |
-| `dtype` | `str` or Python type | Any type string or Python class recognized by [Pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
+| `dtype` | `str` or Python type | Any type string or Python class recognized by [pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
 | `input_name` | `str` | Original column name |
 | `sep` | `str` | Separator string to use for the join |
@@ -158,7 +158,7 @@ Subclass of `ColumnInfo`, concatenates values from multiple columns into a new s
 | Argument | Type | Description |
 | -------- | ---- | ----------- |
 | `name` | `str` | Name of the destination column |
-| `dtype` | `str` or Python type | Any type string or Python class recognized by [Pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
+| `dtype` | `str` or Python type | Any type string or Python class recognized by [pandas](https://pandas.pydata.org/docs/user_guide/basics.html#dtypes) |
 | `input_columns` | `List[str]` | List of columns to concatenate |
 | `sep` | `str` | Separator string |
```

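The `dtype` cells in the tables above accept any type string or Python class that pandas recognizes; a quick standalone illustration:

```python
import pandas as pd

# A type string and a Python class are both valid pandas dtype specs
s1 = pd.Series(["1", "2", "3"]).astype("int64")  # dtype from a string
s2 = pd.Series([1, 2, 3]).astype(float)          # dtype from a class

print(s1.dtype)  # int64
print(s2.dtype)  # float64
```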
examples/abp_pcap_detection/abp_pcap_preprocessing.py (+2 -6)

```diff
@@ -16,17 +16,16 @@
 from functools import partial
 
 import cupy as cp
-import mrc
 import numpy as np
 
 import cudf
 
-import morpheus._lib.messages as _messages
 from morpheus.cli.register_stage import register_stage
 from morpheus.common import TypeId
 from morpheus.config import Config
 from morpheus.config import PipelineModes
 from morpheus.messages import ControlMessage
+from morpheus.messages import InferenceMemoryFIL
 from morpheus.stages.preprocess.preprocess_base_stage import PreprocessBaseStage
@@ -184,7 +183,7 @@ def round_time_kernel(timestamp, rollup_time, secs):
         seq_ids[:, 2] = fea_len - 1
 
         # Create the inference memory. Keep in mind count here could be > than input count
-        memory = _messages.InferenceMemoryFIL(count=count, input__0=data, seq_ids=seq_ids)
+        memory = InferenceMemoryFIL(count=count, input__0=data, seq_ids=seq_ids)
 
         infer_message = ControlMessage(msg)
         infer_message.payload(meta)
@@ -197,6 +196,3 @@ def _get_preprocess_fn(self) -> typing.Callable[[ControlMessage], ControlMessage
                            fea_len=self._fea_length,
                            fea_cols=self.features,
                            req_cols=self.req_cols)
-
-    def _get_preprocess_node(self, builder: mrc.Builder):
-        raise NotImplementedError("C++ node not implemented for this stage")
```

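The `seq_ids` array seen in the preprocessing hunk above maps inference rows back to their source rows. A standalone NumPy illustration of the shape and the `fea_len - 1` assignment from the diff (the `count`, `fea_len` values and the column-0 fill are assumptions for illustration, not taken from the example file):

```python
import numpy as np

count = 4    # number of rows going to inference
fea_len = 3  # number of feature columns

# One row per inference row, three bookkeeping columns; only the
# seq_ids[:, 2] = fea_len - 1 line appears verbatim in the diff above.
seq_ids = np.zeros((count, 3), dtype=np.int64)
seq_ids[:, 0] = np.arange(count)  # assumed: source row index
seq_ids[:, 2] = fea_len - 1       # last feature index, as in the diff

print(seq_ids)
```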