SwatiPanwar · December 13, 2025 18:14
diff --git a/01-Installation.md b/01-Installation.md
diff --git a/02-hello_pipeline.py b/02-hello_pipeline.py
 from kfp import dsl
 from kfp import compiler

 # Define a simple component using a Python function
 @dsl.component
 def say_hello(name: str) -> str:
    """Build a greeting for ``name``, print it, and return it.

    Args:
        name: Who the greeting is addressed to.

    Returns:
        The greeting text, ``Hello, <name>!``.
    """
    greeting = f'Hello, {name}!'
    # Printing makes the greeting visible on the component's standard output.
    print(greeting)
    return greeting

 # Define the pipeline using the @dsl.pipeline decorator
 @dsl.pipeline(
    name="hello-world-pipeline",
    description="A basic pipeline that prints a greeting.",
 )
 def hello_pipeline(recipient: str = "World") -> str:
    """Run ``say_hello`` once and expose its greeting as the pipeline output.

    Args:
        recipient: Name forwarded to ``say_hello``; defaults to "World".

    Returns:
        The output of the ``say_hello`` task.
    """
    greeting_task = say_hello(name=recipient)
    return greeting_task.output

 if __name__ == "__main__":
    # Write the compiled pipeline definition to a YAML file.
    compiler.Compiler().compile(
        pipeline_func=hello_pipeline,
        package_path='hello_world_pipeline.yaml',
    )

    # Running the pipeline is normally done from the Kubeflow Pipelines UI,
    # or with the KFP SDK client when a Kubeflow Pipelines backend is available:
    # from kfp.client import Client
    # client = Client(host='<YOUR-KFP-ENDPOINT>')  # Replace with your endpoint
    # run = client.create_run_from_pipeline_func(hello_pipeline, arguments={'recipient': 'Kubeflow'})
    # print(f"Pipeline run details: {run}")
diff --git a/03-irish_pipeline.py b/03-irish_pipeline.py
 import kfp
 from kfp import dsl
 from typing import NamedTuple, List

 # Step 1: Load data into memory and return as lists
 @dsl.component(
    base_image="python:3.8-slim",
    # Only scikit-learn is needed: load_iris() is called with its defaults
    # and the result is converted with .tolist(), so pandas is never used.
    packages_to_install=["scikit-learn"]
 )
 def load_data() -> NamedTuple("Outputs", [("features", List[List[float]]), ("labels", List[int])]):
    """Load the Iris dataset and return it as plain Python lists.

    Returns:
        A 2-tuple matching the ``Outputs`` fields:
        ``features`` - one list of float measurements per sample;
        ``labels`` - the integer class label of each sample.
    """
    # Imported inside the function because the package is installed in the
    # component's own environment via packages_to_install.
    from sklearn.datasets import load_iris

    iris = load_iris()
    # .tolist() turns the arrays into nested Python lists so they fit the
    # List[...] output annotations.
    return (iris.data.tolist(), iris.target.tolist())

 # Step 2: Train model and return accuracy
 @dsl.component(
    base_image="python:3.8-slim",
    packages_to_install=["scikit-learn"],
 )
 def train_model(
    features: List[List[float]],
    labels: List[int],
 ) -> NamedTuple("Output", [("accuracy", float)]):
    """Fit a random forest on part of the data and score it on the rest.

    The samples are split with ``test_size=0.2``; the classifier is trained
    on the training portion and evaluated on the held-out portion. No random
    seed is passed to the split or the classifier, so the reported accuracy
    can differ between runs.

    Args:
        features: One list of float measurements per sample.
        labels: The integer class label of each sample.

    Returns:
        A 1-tuple holding the accuracy on the held-out samples.
    """
    from sklearn.ensemble import RandomForestClassifier
    from sklearn.metrics import accuracy_score
    from sklearn.model_selection import train_test_split

    train_x, test_x, train_y, test_y = train_test_split(
        features, labels, test_size=0.2
    )

    model = RandomForestClassifier()
    model.fit(train_x, train_y)
    accuracy = accuracy_score(test_y, model.predict(test_x))

    print(f"Model accuracy: {accuracy}")
    return (accuracy,)

 # Step 3: Define the pipeline
 @dsl.pipeline(
    name="iris-no-artifacts-pipeline",
    description="ML pipeline without file artifacts, returns accuracy.",
 )
 def iris_pipeline():
    """Chain ``load_data`` into ``train_model``.

    The ``features`` and ``labels`` outputs of the loading step are passed
    directly as the inputs of the training step.
    """
    load_task = load_data()
    loaded = load_task.outputs
    train_model(features=loaded["features"], labels=loaded["labels"])

 # Step 4: Compile
 if __name__ == "__main__":
    # Import the compiler submodule explicitly instead of reaching it as
    # ``kfp.compiler`` after a bare ``import kfp``; that attribute exists
    # only if something else has already imported the submodule.
    from kfp import compiler

    # Compile the pipeline function into a YAML pipeline definition.
    compiler.Compiler().compile(
        pipeline_func=iris_pipeline,
        package_path="iris_pipeline.yaml",
    )
	from kfp import dsl
	from kfp import compiler

	# Define a simple component using a Python function
	@dsl.component
	def say_hello(name: str) -> str:
	    """Build a greeting for ``name``, print it, and return it.

	    Args:
	        name: Who the greeting is addressed to.

	    Returns:
	        The greeting text, ``Hello, <name>!``.
	    """
	    greeting = f'Hello, {name}!'
	    # Printing makes the greeting visible on the component's standard output.
	    print(greeting)
	    return greeting

	# Define the pipeline using the @dsl.pipeline decorator
	@dsl.pipeline(
	    name="hello-world-pipeline",
	    description="A basic pipeline that prints a greeting.",
	)
	def hello_pipeline(recipient: str = "World") -> str:
	    """Run ``say_hello`` once and expose its greeting as the pipeline output.

	    Args:
	        recipient: Name forwarded to ``say_hello``; defaults to "World".

	    Returns:
	        The output of the ``say_hello`` task.
	    """
	    greeting_task = say_hello(name=recipient)
	    return greeting_task.output

	if __name__ == "__main__":
	    # Write the compiled pipeline definition to a YAML file.
	    compiler.Compiler().compile(
	        pipeline_func=hello_pipeline,
	        package_path='hello_world_pipeline.yaml',
	    )

	    # Running the pipeline is normally done from the Kubeflow Pipelines UI,
	    # or with the KFP SDK client when a Kubeflow Pipelines backend is available:
	    # from kfp.client import Client
	    # client = Client(host='<YOUR-KFP-ENDPOINT>') # Replace with your endpoint
	    # run = client.create_run_from_pipeline_func(hello_pipeline, arguments={'recipient': 'Kubeflow'})
	    # print(f"Pipeline run details: {run}")
	import kfp
	from kfp import dsl
	from typing import NamedTuple, List

	# Step 1: Load data into memory and return as lists
	@dsl.component(
	    base_image="python:3.8-slim",
	    # Only scikit-learn is needed: load_iris() is called with its defaults
	    # and the result is converted with .tolist(), so pandas is never used.
	    packages_to_install=["scikit-learn"]
	)
	def load_data() -> NamedTuple("Outputs", [("features", List[List[float]]), ("labels", List[int])]):
	    """Load the Iris dataset and return it as plain Python lists.

	    Returns:
	        A 2-tuple matching the ``Outputs`` fields:
	        ``features`` - one list of float measurements per sample;
	        ``labels`` - the integer class label of each sample.
	    """
	    # Imported inside the function because the package is installed in the
	    # component's own environment via packages_to_install.
	    from sklearn.datasets import load_iris

	    iris = load_iris()
	    # .tolist() turns the arrays into nested Python lists so they fit the
	    # List[...] output annotations.
	    return (iris.data.tolist(), iris.target.tolist())

	# Step 2: Train model and return accuracy
	@dsl.component(
	    base_image="python:3.8-slim",
	    packages_to_install=["scikit-learn"],
	)
	def train_model(
	    features: List[List[float]],
	    labels: List[int],
	) -> NamedTuple("Output", [("accuracy", float)]):
	    """Fit a random forest on part of the data and score it on the rest.

	    The samples are split with ``test_size=0.2``; the classifier is trained
	    on the training portion and evaluated on the held-out portion. No random
	    seed is passed to the split or the classifier, so the reported accuracy
	    can differ between runs.

	    Args:
	        features: One list of float measurements per sample.
	        labels: The integer class label of each sample.

	    Returns:
	        A 1-tuple holding the accuracy on the held-out samples.
	    """
	    from sklearn.ensemble import RandomForestClassifier
	    from sklearn.metrics import accuracy_score
	    from sklearn.model_selection import train_test_split

	    train_x, test_x, train_y, test_y = train_test_split(
	        features, labels, test_size=0.2
	    )

	    model = RandomForestClassifier()
	    model.fit(train_x, train_y)
	    accuracy = accuracy_score(test_y, model.predict(test_x))

	    print(f"Model accuracy: {accuracy}")
	    return (accuracy,)

	# Step 3: Define the pipeline
	@dsl.pipeline(
	    name="iris-no-artifacts-pipeline",
	    description="ML pipeline without file artifacts, returns accuracy.",
	)
	def iris_pipeline():
	    """Chain ``load_data`` into ``train_model``.

	    The ``features`` and ``labels`` outputs of the loading step are passed
	    directly as the inputs of the training step.
	    """
	    load_task = load_data()
	    loaded = load_task.outputs
	    train_model(features=loaded["features"], labels=loaded["labels"])

	# Step 4: Compile
	if __name__ == "__main__":
	    # Import the compiler submodule explicitly instead of reaching it as
	    # ``kfp.compiler`` after a bare ``import kfp``; that attribute exists
	    # only if something else has already imported the submodule.
	    from kfp import compiler

	    # Compile the pipeline function into a YAML pipeline definition.
	    compiler.Compiler().compile(
	        pipeline_func=iris_pipeline,
	        package_path="iris_pipeline.yaml",
	    )