From 81a79c0a31a3f8dc70e515f464b876985f47a8bd Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Tue, 28 Oct 2025 00:29:51 -0400
Subject: [PATCH 01/15] feature: basic TagSet functionality

---
 alpacloud/eztag/BUILD       |  35 ++++++
 alpacloud/eztag/__init__.py |   0
 alpacloud/eztag/readme.md   |  23 ++++
 alpacloud/eztag/tag.py      |  28 +++++
 alpacloud/eztag/tag_test.py | 239 ++++++++++++++++++++++++++++++++++++
 5 files changed, 325 insertions(+)
 create mode 100644 alpacloud/eztag/BUILD
 create mode 100644 alpacloud/eztag/__init__.py
 create mode 100644 alpacloud/eztag/readme.md
 create mode 100644 alpacloud/eztag/tag.py
 create mode 100644 alpacloud/eztag/tag_test.py

diff --git a/alpacloud/eztag/BUILD b/alpacloud/eztag/BUILD
new file mode 100644
index 0000000..558d9df
--- /dev/null
+++ b/alpacloud/eztag/BUILD
@@ -0,0 +1,35 @@
+python_sources()
+
+python_tests(
+	name="tests",
+#	dependencies=["./test_resources:k8s_objs"],
+)
+
+python_test_utils(
+	name="test_utils",
+)
+
+python_distribution(
+	name="alpacloud.eztag",
+	repositories=["@alpacloud.eztag"],
+	dependencies=[":lens"],
+	long_description_path="alpacloud/eztag/readme.md",
+	provides=python_artifact(
+		name="alpacloud_eztag",
+		version="0.1.0",
+		description="A library for filtering things based on tags",
+		author="Daniel Goldman",
+		classifiers=[
+			"Development Status :: 3 - Alpha",
+			"Programming Language :: Python :: 3.10",
+			"Programming Language :: Python :: 3.11",
+			"Programming Language :: Python :: 3.12",
+			"Programming Language :: Python :: 3.13",
+			"Programming Language :: Python :: 3.14",
+			"Topic :: Utilities",
+			"Topic :: System :: Systems Administration",
+		],
+		license="Round Robin 2.0.0",
+		long_description_content_type="text/markdown",
+	),
+)
diff --git a/alpacloud/eztag/__init__.py b/alpacloud/eztag/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/alpacloud/eztag/readme.md b/alpacloud/eztag/readme.md
new file mode 100644
index 0000000..916107b
--- /dev/null
+++ b/alpacloud/eztag/readme.md
@@ -0,0 +1,23 @@
+# alpacloud.eztag
+
+`eztag` helps you easily filter things by tags. For example:
+```python
+@dataclass
+class Snippet:
+    name: str
+    content: str
+    tags: TagSet
+```
+
+you can filter them with convenient syntax:
+
+```python
+filter(lambda s: s.tags.has("python"), snippets)
+```
+
+There are several filter functions available:
+
+- has : check if a TagSet has a tag
+- match : check if a TagSet has a key with a value
+- rematch : check if a TagSet has a key with a value that matches a regex
+- contains : check if a TagSet has a key whose value contains a substring
diff --git a/alpacloud/eztag/tag.py b/alpacloud/eztag/tag.py
new file mode 100644
index 0000000..ce23283
--- /dev/null
+++ b/alpacloud/eztag/tag.py
@@ -0,0 +1,28 @@
+from __future__ import annotations
+
+import re
+from dataclasses import dataclass
+
+@dataclass
+class TagSet:
+	"""A set of tags"""
+	ts: dict[str, str | None]
+
+	def has(self, k: str) -> bool:
+		"""Check if the key exists in the tagset"""
+		return k in self.ts
+
+	def match(self, k: str, v: str) -> bool:
+		"""Exact match the value for this key"""
+		return self.ts[k] == v
+
+	def rematch(self, k: str, v: str | re.Pattern) -> bool:
+		"""Regex match the value for this key"""
+		if isinstance(v, str):
+			v = re.compile(v)
+
+		return self.has(k) and v.fullmatch(self.ts[k]) is not None
+
+	def contains(self, k: str, v: str) -> bool:
+		"""Check if the value for this key contains the substring"""
+		return self.has(k) and self.ts[k] is not None and v in self.ts[k]
diff --git a/alpacloud/eztag/tag_test.py b/alpacloud/eztag/tag_test.py
new file mode 100644
index 0000000..d9c57f8
--- /dev/null
+++ b/alpacloud/eztag/tag_test.py
@@ -0,0 +1,239 @@
+from __future__ import annotations
+
+import re
+import pytest
+
+from alpacloud.eztag.tag import TagSet
+
+
+class TestTagSetHas:
+    """Tests for TagSet.has() method"""
+
+    def test_has_returns_true_when_key_exists(self):
+        tagset = TagSet(ts={"env": "prod", "region": "us-east-1"})
+        assert tagset.has("env") is True
+
+    def test_has_returns_false_when_key_does_not_exist(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.has("region") is False
+
+    def test_has_returns_true_when_key_exists_with_none_value(self):
+        tagset = TagSet(ts={"env": None})
+        assert tagset.has("env") is True
+
+    def test_has_with_empty_tagset(self):
+        tagset = TagSet(ts={})
+        assert tagset.has("any_key") is False
+
+    def test_has_with_empty_string_key(self):
+        tagset = TagSet(ts={"": "value"})
+        assert tagset.has("") is True
+
+
+class TestTagSetMatch:
+    """Tests for TagSet.match() method"""
+
+    def test_match_returns_true_when_key_and_value_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.match("env", "prod") is True
+
+    def test_match_returns_false_when_value_does_not_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.match("env", "dev") is False
+
+    def test_match_returns_false_when_key_does_not_exist(self):
+        tagset = TagSet(ts={"env": "prod"})
+        with pytest.raises(KeyError):
+            tagset.match("region", "us-east-1")
+
+    def test_match_with_none_value(self):
+        tagset = TagSet(ts={"env": None})
+        assert tagset.match("env", None) is True
+
+    def test_match_none_value_against_string_returns_false(self):
+        tagset = TagSet(ts={"env": None})
+        assert tagset.match("env", "prod") is False
+
+    def test_match_string_value_against_none_returns_false(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.match("env", None) is False
+
+    def test_match_with_empty_string_value(self):
+        tagset = TagSet(ts={"env": ""})
+        assert tagset.match("env", "") is True
+
+    def test_match_case_sensitive(self):
+        tagset = TagSet(ts={"env": "Prod"})
+        assert tagset.match("env", "prod") is False
+        assert tagset.match("env", "Prod") is True
+
+
+class TestTagSetRematch:
+    """Tests for TagSet.rematch() method"""
+
+    def test_rematch_with_string_pattern_matches(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.rematch("env", "prod") is True
+
+    def test_rematch_with_string_pattern_does_not_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.rematch("env", "dev") is False
+
+    def test_rematch_with_regex_pattern_matches(self):
+        tagset = TagSet(ts={"env": "prod-01"})
+        assert tagset.rematch("env", r"prod-\d+") is True
+
+    def test_rematch_with_regex_pattern_does_not_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.rematch("env", r"prod-\d+") is False
+
+    def test_rematch_with_compiled_pattern_matches(self):
+        tagset = TagSet(ts={"env": "prod-01"})
+        pattern = re.compile(r"prod-\d+")
+        assert tagset.rematch("env", pattern) is True
+
+    def test_rematch_with_compiled_pattern_does_not_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        pattern = re.compile(r"prod-\d+")
+        assert tagset.rematch("env", pattern) is False
+
+    def test_rematch_returns_false_when_key_does_not_exist(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.rematch("region", "us-.*") is False
+
+    def test_rematch_with_wildcard_pattern(self):
+        tagset = TagSet(ts={"env": "production"})
+        assert tagset.rematch("env", "prod.*") is True
+
+    def test_rematch_with_alternation_pattern(self):
+        tagset = TagSet(ts={"env": "staging"})
+        assert tagset.rematch("env", "prod|staging|dev") is True
+
+    def test_rematch_requires_full_match(self):
+        tagset = TagSet(ts={"env": "my-prod-env"})
+        # Should not match because rematch uses fullmatch (not partial match)
+        assert tagset.rematch("env", "prod") is False
+        assert tagset.rematch("env", ".*prod.*") is True
+
+    def test_rematch_with_empty_string_pattern(self):
+        tagset = TagSet(ts={"env": ""})
+        assert tagset.rematch("env", "") is True
+
+    def test_rematch_with_special_regex_characters(self):
+        tagset = TagSet(ts={"version": "1.2.3"})
+        # Without escaping, '.' matches any character
+        assert tagset.rematch("version", r"1.2.3") is True
+        # With proper escaping
+        assert tagset.rematch("version", r"1\.2\.3") is True
+
+    def test_rematch_case_sensitive_by_default(self):
+        tagset = TagSet(ts={"env": "Prod"})
+        assert tagset.rematch("env", "prod") is False
+        assert tagset.rematch("env", "Prod") is True
+
+    def test_rematch_with_case_insensitive_pattern(self):
+        tagset = TagSet(ts={"env": "Prod"})
+        pattern = re.compile("prod", re.IGNORECASE)
+        assert tagset.rematch("env", pattern) is True
+
+    def test_rematch_with_none_value_fails(self):
+        tagset = TagSet(ts={"env": None})
+        # This should raise an AttributeError because None doesn't have the
+        # methods that fullmatch expects
+        with pytest.raises(TypeError):
+            tagset.rematch("env", "prod")
+
+
+class TestTagSetContains:
+    """Tests for TagSet.contains() method"""
+
+    def test_contains_returns_true_when_substring_exists(self):
+        tagset = TagSet(ts={"env": "production"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_returns_false_when_substring_does_not_exist(self):
+        tagset = TagSet(ts={"env": "production"})
+        assert tagset.contains("env", "dev") is False
+
+    def test_contains_returns_false_when_key_does_not_exist(self):
+        tagset = TagSet(ts={"env": "production"})
+        assert tagset.contains("region", "us") is False
+
+    def test_contains_with_exact_match(self):
+        tagset = TagSet(ts={"env": "prod"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_with_empty_substring(self):
+        tagset = TagSet(ts={"env": "prod"})
+        # Empty string is contained in any string
+        assert tagset.contains("env", "") is True
+
+    def test_contains_with_empty_string_value(self):
+        tagset = TagSet(ts={"env": ""})
+        assert tagset.contains("env", "") is True
+        assert tagset.contains("env", "anything") is False
+
+    def test_contains_with_none_value_returns_false(self):
+        tagset = TagSet(ts={"env": None})
+        assert tagset.contains("env", "prod") is False
+
+    def test_contains_case_sensitive(self):
+        tagset = TagSet(ts={"env": "Production"})
+        assert tagset.contains("env", "Prod") is True
+        assert tagset.contains("env", "prod") is False
+
+    def test_contains_with_substring_at_start(self):
+        tagset = TagSet(ts={"env": "production-east"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_with_substring_at_end(self):
+        tagset = TagSet(ts={"env": "my-prod"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_with_substring_in_middle(self):
+        tagset = TagSet(ts={"env": "my-prod-env"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_with_multiple_occurrences(self):
+        tagset = TagSet(ts={"env": "prod-prod-prod"})
+        assert tagset.contains("env", "prod") is True
+
+    def test_contains_with_special_characters(self):
+        tagset = TagSet(ts={"version": "v1.2.3-beta"})
+        assert tagset.contains("version", "1.2") is True
+        assert tagset.contains("version", "-beta") is True
+        assert tagset.contains("version", ".") is True
+
+    def test_contains_with_whitespace(self):
+        tagset = TagSet(ts={"description": "prod environment"})
+        assert tagset.contains("description", "prod env") is True
+        assert tagset.contains("description", " ") is True
+
+    def test_contains_does_not_treat_substring_as_regex(self):
+        tagset = TagSet(ts={"env": "prod123"})
+        # The substring is literal, not a regex pattern
+        assert tagset.contains("env", r"\d+") is False
+        assert tagset.contains("env", "prod") is True
+        assert tagset.contains("env", "123") is True
+
+
+class TestTagSetIntegration:
+    """Integration tests for TagSet"""
+
+    def test_tagset_with_multiple_operations(self):
+        tagset = TagSet(ts={
+            "env": "prod",
+            "region": "us-east-1",
+            "version": "1.2.3",
+            "team": "platform"
+        })
+
+        assert tagset.has("env")
+        assert tagset.match("env", "prod")
+        assert tagset.rematch("region", r"us-.*")
+        assert tagset.rematch("version", r"\d+\.\d+\.\d+")
+        assert not tagset.has("missing_key")
+
+    def test_tagset_empty_initialization(self):
+        tagset = TagSet(ts={})
+        assert not tagset.has("any_key")
\ No newline at end of file

From be81778b39a5d19b4504c902047927c9c92640cc Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Tue, 28 Oct 2025 01:01:37 -0400
Subject: [PATCH 02/15] feature: reimplement as MultiDict

---
 alpacloud/eztag/BUILD        |   2 +-
 alpacloud/eztag/multidict.py |  48 ++++
 alpacloud/eztag/tag.py       |  28 +-
 alpacloud/eztag/tag_test.py  | 510 +++++++++++++++++++++--------------
 4 files changed, 373 insertions(+), 215 deletions(-)
 create mode 100644 alpacloud/eztag/multidict.py

diff --git a/alpacloud/eztag/BUILD b/alpacloud/eztag/BUILD
index 558d9df..f371540 100644
--- a/alpacloud/eztag/BUILD
+++ b/alpacloud/eztag/BUILD
@@ -2,7 +2,7 @@ python_sources()
 
 python_tests(
 	name="tests",
-#	dependencies=["./test_resources:k8s_objs"],
+	# dependencies=["./test_resources:k8s_objs"],
 )
 
 python_test_utils(
diff --git a/alpacloud/eztag/multidict.py b/alpacloud/eztag/multidict.py
new file mode 100644
index 0000000..30f5d1b
--- /dev/null
+++ b/alpacloud/eztag/multidict.py
@@ -0,0 +1,48 @@
+from typing import Iterable, TypeAlias
+
+K: TypeAlias = str
+V: TypeAlias = str | None
+
+
+def _is_collection(obj):
+	"""
+	Checks if an object is an iterable collection, excluding strings and bytes.
+	"""
+	return isinstance(obj, Iterable) and not isinstance(obj, (str, bytes, bytearray))
+
+
+class MultiDict:
+	"""
+	A dictionary that allows multiple values for the same key.
+	This allows us to have a tag set like `env=prd, env=stg`
+	"""
+
+	def __init__(self):
+		self.d: dict[K, set[V]] = {}
+
+	@classmethod
+	def from_dict(cls, d: dict[K, V]):
+		md = cls()
+		for k, v in d.items():
+			md[k] = {v}
+		return md
+
+	@classmethod
+	def create(cls, d: dict[K, Iterable[V] | V]):
+		md = cls()
+		for k, vs in d.items():
+			if not _is_collection(vs):
+				n = {vs}
+			else:
+				n = set(vs)
+			md.d[k] = n
+		return md
+
+	def __getitem__(self, key):
+		return self.d[key]
+
+	def __setitem__(self, key, value):
+		self.d.setdefault(key, set()).add(value)
+
+	def __contains__(self, key):
+		return key in self.d
diff --git a/alpacloud/eztag/tag.py b/alpacloud/eztag/tag.py
index ce23283..2bc0112 100644
--- a/alpacloud/eztag/tag.py
+++ b/alpacloud/eztag/tag.py
@@ -3,26 +3,38 @@
 import re
 from dataclasses import dataclass
 
+from alpacloud.eztag.multidict import MultiDict
+
+
 @dataclass
 class TagSet:
 	"""A set of tags"""
-	ts: dict[str, str | None]
+
+	ts: MultiDict
 
 	def has(self, k: str) -> bool:
 		"""Check if the key exists in the tagset"""
 		return k in self.ts
 
-	def match(self, k: str, v: str) -> bool:
-		"""Exact match the value for this key"""
-		return self.ts[k] == v
+	def match(self, k: str, v: str | None) -> bool:
+		"""Exact match the value for this key (returns True if any value matches)"""
+		if not self.has(k):
+			return False
+		return v in self.ts[k]
 
 	def rematch(self, k: str, v: str | re.Pattern) -> bool:
-		"""Regex match the value for this key"""
+		"""Regex match the value for this key (returns True if any value matches)"""
 		if isinstance(v, str):
 			v = re.compile(v)
 
-		return self.has(k) and v.fullmatch(self.ts[k]) is not None
+		if not self.has(k):
+			return False
+
+		return any(val is not None and v.fullmatch(val) is not None for val in self.ts[k])
 
 	def contains(self, k: str, v: str) -> bool:
-		"""Check if the value for this key contains the substring"""
-		return self.has(k) and self.ts[k] is not None and v in self.ts[k]
+		"""Check if any value for this key contains the substring"""
+		if not self.has(k):
+			return False
+
+		return any(val is not None and v in val for val in self.ts[k])
diff --git a/alpacloud/eztag/tag_test.py b/alpacloud/eztag/tag_test.py
index d9c57f8..f7383aa 100644
--- a/alpacloud/eztag/tag_test.py
+++ b/alpacloud/eztag/tag_test.py
@@ -1,239 +1,337 @@
 from __future__ import annotations
 
 import re
-import pytest
 
+from alpacloud.eztag.multidict import MultiDict
 from alpacloud.eztag.tag import TagSet
 
 
 class TestTagSetHas:
-    """Tests for TagSet.has() method"""
+	"""Tests for TagSet.has() method"""
 
-    def test_has_returns_true_when_key_exists(self):
-        tagset = TagSet(ts={"env": "prod", "region": "us-east-1"})
-        assert tagset.has("env") is True
+	def test_has_returns_true_when_key_exists(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod", "region": "us-east-1"}))
+		assert tagset.has("env") is True
 
-    def test_has_returns_false_when_key_does_not_exist(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.has("region") is False
+	def test_has_returns_false_when_key_does_not_exist(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.has("region") is False
 
-    def test_has_returns_true_when_key_exists_with_none_value(self):
-        tagset = TagSet(ts={"env": None})
-        assert tagset.has("env") is True
+	def test_has_returns_true_when_key_exists_with_none_value(self):
+		tagset = TagSet(ts=MultiDict.create({"env": None}))
+		assert tagset.has("env") is True
 
-    def test_has_with_empty_tagset(self):
-        tagset = TagSet(ts={})
-        assert tagset.has("any_key") is False
+	def test_has_with_empty_tagset(self):
+		tagset = TagSet(ts=MultiDict.create({}))
+		assert tagset.has("any_key") is False
 
-    def test_has_with_empty_string_key(self):
-        tagset = TagSet(ts={"": "value"})
-        assert tagset.has("") is True
+	def test_has_with_empty_string_key(self):
+		tagset = TagSet(ts=MultiDict.create({"": "value"}))
+		assert tagset.has("") is True
+
+	def test_has_with_multiple_values_for_key(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod", "staging"]}))
+		assert tagset.has("env") is True
 
 
 class TestTagSetMatch:
-    """Tests for TagSet.match() method"""
+	"""Tests for TagSet.match() method"""
+
+	def test_match_returns_true_when_key_and_value_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.match("env", "prod") is True
+
+	def test_match_returns_false_when_value_does_not_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.match("env", "dev") is False
 
-    def test_match_returns_true_when_key_and_value_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.match("env", "prod") is True
+	def test_match_returns_false_when_key_does_not_exist(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.match("region", "us-east-1") is False
 
-    def test_match_returns_false_when_value_does_not_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.match("env", "dev") is False
+	def test_match_with_none_value(self):
+		tagset = TagSet(ts=MultiDict.create({"env": None}))
+		assert tagset.match("env", None) is True
 
-    def test_match_returns_false_when_key_does_not_exist(self):
-        tagset = TagSet(ts={"env": "prod"})
-        with pytest.raises(KeyError):
-            tagset.match("region", "us-east-1")
+	def test_match_none_value_against_string_returns_false(self):
+		tagset = TagSet(ts=MultiDict.create({"env": None}))
+		assert tagset.match("env", "prod") is False
 
-    def test_match_with_none_value(self):
-        tagset = TagSet(ts={"env": None})
-        assert tagset.match("env", None) is True
+	def test_match_string_value_against_none_returns_false(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.match("env", None) is False
 
-    def test_match_none_value_against_string_returns_false(self):
-        tagset = TagSet(ts={"env": None})
-        assert tagset.match("env", "prod") is False
+	def test_match_with_empty_string_value(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ""}))
+		assert tagset.match("env", "") is True
 
-    def test_match_string_value_against_none_returns_false(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.match("env", None) is False
+	def test_match_case_sensitive(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "Prod"}))
+		assert tagset.match("env", "prod") is False
+		assert tagset.match("env", "Prod") is True
 
-    def test_match_with_empty_string_value(self):
-        tagset = TagSet(ts={"env": ""})
-        assert tagset.match("env", "") is True
+	def test_match_with_multiple_values_matches_any(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod", "staging", "dev"]}))
+		assert tagset.match("env", "prod") is True
+		assert tagset.match("env", "staging") is True
+		assert tagset.match("env", "dev") is True
+		assert tagset.match("env", "test") is False
 
-    def test_match_case_sensitive(self):
-        tagset = TagSet(ts={"env": "Prod"})
-        assert tagset.match("env", "prod") is False
-        assert tagset.match("env", "Prod") is True
+	def test_match_with_multiple_values_including_none(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod", None]}))
+		assert tagset.match("env", "prod") is True
+		assert tagset.match("env", None) is True
+		assert tagset.match("env", "dev") is False
 
 
 class TestTagSetRematch:
-    """Tests for TagSet.rematch() method"""
-
-    def test_rematch_with_string_pattern_matches(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.rematch("env", "prod") is True
-
-    def test_rematch_with_string_pattern_does_not_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.rematch("env", "dev") is False
-
-    def test_rematch_with_regex_pattern_matches(self):
-        tagset = TagSet(ts={"env": "prod-01"})
-        assert tagset.rematch("env", r"prod-\d+") is True
-
-    def test_rematch_with_regex_pattern_does_not_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.rematch("env", r"prod-\d+") is False
-
-    def test_rematch_with_compiled_pattern_matches(self):
-        tagset = TagSet(ts={"env": "prod-01"})
-        pattern = re.compile(r"prod-\d+")
-        assert tagset.rematch("env", pattern) is True
-
-    def test_rematch_with_compiled_pattern_does_not_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        pattern = re.compile(r"prod-\d+")
-        assert tagset.rematch("env", pattern) is False
-
-    def test_rematch_returns_false_when_key_does_not_exist(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.rematch("region", "us-.*") is False
-
-    def test_rematch_with_wildcard_pattern(self):
-        tagset = TagSet(ts={"env": "production"})
-        assert tagset.rematch("env", "prod.*") is True
-
-    def test_rematch_with_alternation_pattern(self):
-        tagset = TagSet(ts={"env": "staging"})
-        assert tagset.rematch("env", "prod|staging|dev") is True
-
-    def test_rematch_requires_full_match(self):
-        tagset = TagSet(ts={"env": "my-prod-env"})
-        # Should not match because rematch uses fullmatch (not partial match)
-        assert tagset.rematch("env", "prod") is False
-        assert tagset.rematch("env", ".*prod.*") is True
-
-    def test_rematch_with_empty_string_pattern(self):
-        tagset = TagSet(ts={"env": ""})
-        assert tagset.rematch("env", "") is True
-
-    def test_rematch_with_special_regex_characters(self):
-        tagset = TagSet(ts={"version": "1.2.3"})
-        # Without escaping, '.' matches any character
-        assert tagset.rematch("version", r"1.2.3") is True
-        # With proper escaping
-        assert tagset.rematch("version", r"1\.2\.3") is True
-
-    def test_rematch_case_sensitive_by_default(self):
-        tagset = TagSet(ts={"env": "Prod"})
-        assert tagset.rematch("env", "prod") is False
-        assert tagset.rematch("env", "Prod") is True
-
-    def test_rematch_with_case_insensitive_pattern(self):
-        tagset = TagSet(ts={"env": "Prod"})
-        pattern = re.compile("prod", re.IGNORECASE)
-        assert tagset.rematch("env", pattern) is True
-
-    def test_rematch_with_none_value_fails(self):
-        tagset = TagSet(ts={"env": None})
-        # This should raise an AttributeError because None doesn't have the
-        # methods that fullmatch expects
-        with pytest.raises(TypeError):
-            tagset.rematch("env", "prod")
+	"""Tests for TagSet.rematch() method"""
+
+	def test_rematch_with_string_pattern_matches(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.rematch("env", "prod") is True
+
+	def test_rematch_with_string_pattern_does_not_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.rematch("env", "dev") is False
+
+	def test_rematch_with_regex_pattern_matches(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod-01"}))
+		assert tagset.rematch("env", r"prod-\d+") is True
+
+	def test_rematch_with_regex_pattern_does_not_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.rematch("env", r"prod-\d+") is False
+
+	def test_rematch_with_compiled_pattern_matches(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod-01"}))
+		pattern = re.compile(r"prod-\d+")
+		assert tagset.rematch("env", pattern) is True
+
+	def test_rematch_with_compiled_pattern_does_not_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		pattern = re.compile(r"prod-\d+")
+		assert tagset.rematch("env", pattern) is False
+
+	def test_rematch_returns_false_when_key_does_not_exist(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.rematch("region", "us-.*") is False
+
+	def test_rematch_with_wildcard_pattern(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "production"}))
+		assert tagset.rematch("env", "prod.*") is True
+
+	def test_rematch_with_alternation_pattern(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "staging"}))
+		assert tagset.rematch("env", "prod|staging|dev") is True
+
+	def test_rematch_requires_full_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "my-prod-env"}))
+		# Should not match because rematch uses fullmatch (not partial match)
+		assert tagset.rematch("env", "prod") is False
+		assert tagset.rematch("env", ".*prod.*") is True
+
+	def test_rematch_with_empty_string_pattern(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ""}))
+		assert tagset.rematch("env", "") is True
+
+	def test_rematch_with_special_regex_characters(self):
+		tagset = TagSet(ts=MultiDict.create({"version": "1.2.3"}))
+		# Without escaping, '.' matches any character
+		assert tagset.rematch("version", r"1.2.3") is True
+		# With proper escaping
+		assert tagset.rematch("version", r"1\.2\.3") is True
+
+	def test_rematch_case_sensitive_by_default(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "Prod"}))
+		assert tagset.rematch("env", "prod") is False
+		assert tagset.rematch("env", "Prod") is True
+
+	def test_rematch_with_case_insensitive_pattern(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "Prod"}))
+		pattern = re.compile("prod", re.IGNORECASE)
+		assert tagset.rematch("env", pattern) is True
+
+	def test_rematch_with_none_value_returns_false(self):
+		tagset = TagSet(ts=MultiDict.create({"env": None}))
+		# None values should be skipped
+		assert tagset.rematch("env", "prod") is False
+
+	def test_rematch_with_multiple_values_matches_any(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod-01", "staging-02", "dev-03"]}))
+		assert tagset.rematch("env", r"prod-\d+") is True
+		assert tagset.rematch("env", r"staging-\d+") is True
+		assert tagset.rematch("env", r"dev-\d+") is True
+		assert tagset.rematch("env", r"test-\d+") is False
+
+	def test_rematch_with_multiple_values_one_matches(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["production", "prod-01", "my-env"]}))
+		# Should match because at least one value matches
+		assert tagset.rematch("env", r"prod-\d+") is True
+
+	def test_rematch_with_multiple_values_including_none(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod-01", None, "staging"]}))
+		# Should skip None and still find matches
+		assert tagset.rematch("env", r"prod-\d+") is True
+		assert tagset.rematch("env", "staging") is True
 
 
 class TestTagSetContains:
-    """Tests for TagSet.contains() method"""
-
-    def test_contains_returns_true_when_substring_exists(self):
-        tagset = TagSet(ts={"env": "production"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_returns_false_when_substring_does_not_exist(self):
-        tagset = TagSet(ts={"env": "production"})
-        assert tagset.contains("env", "dev") is False
-
-    def test_contains_returns_false_when_key_does_not_exist(self):
-        tagset = TagSet(ts={"env": "production"})
-        assert tagset.contains("region", "us") is False
-
-    def test_contains_with_exact_match(self):
-        tagset = TagSet(ts={"env": "prod"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_with_empty_substring(self):
-        tagset = TagSet(ts={"env": "prod"})
-        # Empty string is contained in any string
-        assert tagset.contains("env", "") is True
-
-    def test_contains_with_empty_string_value(self):
-        tagset = TagSet(ts={"env": ""})
-        assert tagset.contains("env", "") is True
-        assert tagset.contains("env", "anything") is False
-
-    def test_contains_with_none_value_returns_false(self):
-        tagset = TagSet(ts={"env": None})
-        assert tagset.contains("env", "prod") is False
-
-    def test_contains_case_sensitive(self):
-        tagset = TagSet(ts={"env": "Production"})
-        assert tagset.contains("env", "Prod") is True
-        assert tagset.contains("env", "prod") is False
-
-    def test_contains_with_substring_at_start(self):
-        tagset = TagSet(ts={"env": "production-east"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_with_substring_at_end(self):
-        tagset = TagSet(ts={"env": "my-prod"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_with_substring_in_middle(self):
-        tagset = TagSet(ts={"env": "my-prod-env"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_with_multiple_occurrences(self):
-        tagset = TagSet(ts={"env": "prod-prod-prod"})
-        assert tagset.contains("env", "prod") is True
-
-    def test_contains_with_special_characters(self):
-        tagset = TagSet(ts={"version": "v1.2.3-beta"})
-        assert tagset.contains("version", "1.2") is True
-        assert tagset.contains("version", "-beta") is True
-        assert tagset.contains("version", ".") is True
-
-    def test_contains_with_whitespace(self):
-        tagset = TagSet(ts={"description": "prod environment"})
-        assert tagset.contains("description", "prod env") is True
-        assert tagset.contains("description", " ") is True
-
-    def test_contains_does_not_treat_substring_as_regex(self):
-        tagset = TagSet(ts={"env": "prod123"})
-        # The substring is literal, not a regex pattern
-        assert tagset.contains("env", r"\d+") is False
-        assert tagset.contains("env", "prod") is True
-        assert tagset.contains("env", "123") is True
+	"""Tests for TagSet.contains() method"""
+
+	def test_contains_returns_true_when_substring_exists(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "production"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_returns_false_when_substring_does_not_exist(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "production"}))
+		assert tagset.contains("env", "dev") is False
+
+	def test_contains_returns_false_when_key_does_not_exist(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "production"}))
+		assert tagset.contains("region", "us") is False
+
+	def test_contains_with_exact_match(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_empty_substring(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod"}))
+		# Empty string is contained in any string
+		assert tagset.contains("env", "") is True
+
+	def test_contains_with_empty_string_value(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ""}))
+		assert tagset.contains("env", "") is True
+		assert tagset.contains("env", "anything") is False
+
+	def test_contains_with_none_value_returns_false(self):
+		tagset = TagSet(ts=MultiDict.create({"env": None}))
+		assert tagset.contains("env", "prod") is False
+
+	def test_contains_case_sensitive(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "Production"}))
+		assert tagset.contains("env", "Prod") is True
+		assert tagset.contains("env", "prod") is False
+
+	def test_contains_with_substring_at_start(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "production-east"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_substring_at_end(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "my-prod"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_substring_in_middle(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "my-prod-env"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_multiple_occurrences(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod-prod-prod"}))
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_special_characters(self):
+		tagset = TagSet(ts=MultiDict.create({"version": "v1.2.3-beta"}))
+		assert tagset.contains("version", "1.2") is True
+		assert tagset.contains("version", "-beta") is True
+		assert tagset.contains("version", ".") is True
+
+	def test_contains_with_whitespace(self):
+		tagset = TagSet(ts=MultiDict.create({"description": "prod environment"}))
+		assert tagset.contains("description", "prod env") is True
+		assert tagset.contains("description", " ") is True
+
+	def test_contains_does_not_treat_substring_as_regex(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod123"}))
+		# The substring is literal, not a regex pattern
+		assert tagset.contains("env", r"\d+") is False
+		assert tagset.contains("env", "prod") is True
+		assert tagset.contains("env", "123") is True
+
+	def test_contains_with_multiple_values_matches_any(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["production", "staging", "development"]}))
+		assert tagset.contains("env", "prod") is True
+		assert tagset.contains("env", "stag") is True
+		assert tagset.contains("env", "dev") is True
+		assert tagset.contains("env", "test") is False
+
+	def test_contains_with_multiple_values_one_matches(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["my-env", "production", "other"]}))
+		# Should match because at least one value contains the substring
+		assert tagset.contains("env", "prod") is True
+
+	def test_contains_with_multiple_values_including_none(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["production", None, "staging"]}))
+		# Should skip None and still find matches
+		assert tagset.contains("env", "prod") is True
+		assert tagset.contains("env", "stag") is True
 
 
 class TestTagSetIntegration:
-    """Integration tests for TagSet"""
-
-    def test_tagset_with_multiple_operations(self):
-        tagset = TagSet(ts={
-            "env": "prod",
-            "region": "us-east-1",
-            "version": "1.2.3",
-            "team": "platform"
-        })
-
-        assert tagset.has("env")
-        assert tagset.match("env", "prod")
-        assert tagset.rematch("region", r"us-.*")
-        assert tagset.rematch("version", r"\d+\.\d+\.\d+")
-        assert not tagset.has("missing_key")
-
-    def test_tagset_empty_initialization(self):
-        tagset = TagSet(ts={})
-        assert not tagset.has("any_key")
\ No newline at end of file
+	"""Integration tests for TagSet"""
+
+	def test_tagset_with_multiple_operations(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "prod", "region": "us-east-1", "version": "1.2.3", "team": "platform"}))
+
+		assert tagset.has("env")
+		assert tagset.match("env", "prod")
+		assert tagset.rematch("region", r"us-.*")
+		assert tagset.rematch("version", r"\d+\.\d+\.\d+")
+		assert tagset.contains("region", "east")
+		assert tagset.contains("team", "plat")
+		assert not tagset.has("missing_key")
+
+	def test_tagset_empty_initialization(self):
+		tagset = TagSet(ts=MultiDict.create({}))
+		assert not tagset.has("any_key")
+
+	def test_contains_vs_match_vs_rematch(self):
+		tagset = TagSet(ts=MultiDict.create({"env": "my-prod-environment"}))
+
+		# match requires exact equality
+		assert not tagset.match("env", "prod")
+		assert tagset.match("env", "my-prod-environment")
+
+		# contains checks for substring
+		assert tagset.contains("env", "prod")
+		assert tagset.contains("env", "environment")
+
+		# rematch requires full regex match
+		assert not tagset.rematch("env", "prod")
+		assert tagset.rematch("env", r".*prod.*")
+		assert tagset.rematch("env", r"my-\w+-environment")
+
+	def test_tagset_with_multiple_values_per_key(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod", "staging"], "region": ["us-east-1", "us-west-2"]}))
+
+		# has() checks key existence
+		assert tagset.has("env")
+		assert tagset.has("region")
+
+		# match() returns True if ANY value matches
+		assert tagset.match("env", "prod")
+		assert tagset.match("env", "staging")
+		assert not tagset.match("env", "dev")
+
+		# rematch() returns True if ANY value matches
+		assert tagset.rematch("region", r"us-.*")
+		assert tagset.rematch("region", r".*east.*")
+		assert tagset.rematch("region", r".*west.*")
+
+		# contains() returns True if ANY value contains substring
+		assert tagset.contains("env", "prod")
+		assert tagset.contains("env", "stag")
+		assert tagset.contains("region", "east")
+		assert tagset.contains("region", "west")
+
+	def test_mixed_none_and_string_values(self):
+		tagset = TagSet(ts=MultiDict.create({"env": ["prod", None, "staging"]}))
+
+		assert tagset.has("env")
+		assert tagset.match("env", "prod")
+		assert tagset.match("env", None)
+		assert tagset.match("env", "staging")
+
+		# rematch and contains should skip None values
+		assert tagset.rematch("env", "prod")
+		assert tagset.contains("env", "prod")

From 6f00495e99ef55a2c709e3e5f5e1a2ca0c78a3f6 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 15:04:26 -0500
Subject: [PATCH 03/15] feature: basic logic operations

---
 alpacloud/eztag/logic.py | 80 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 80 insertions(+)
 create mode 100644 alpacloud/eztag/logic.py

diff --git a/alpacloud/eztag/logic.py b/alpacloud/eztag/logic.py
new file mode 100644
index 0000000..ee32910
--- /dev/null
+++ b/alpacloud/eztag/logic.py
@@ -0,0 +1,80 @@
+from abc import ABC
+from dataclasses import dataclass
+from typing import Callable
+
+from alpacloud.eztag.tag import TagSet
+
+
+class Exp(ABC):
+	"""A predicate"""
+
+	def check(self, tags: TagSet) -> bool:
+		"""Check if the condition is satisfied"""
+		raise NotImplementedError
+
+
+@dataclass(frozen=True, slots=True)
+class Cond_(Exp):
+	f: Callable[[TagSet], bool]
+
+	def check(self, tags: TagSet) -> bool:
+		return self.f(tags)
+
+
+@dataclass(frozen=True, slots=True)
+class And_(Exp):
+	conds: list[Cond_]
+
+	def check(self, tags: TagSet) -> bool:
+		return all(cond.check(tags) for cond in self.conds)
+
+
+@dataclass(frozen=True, slots=True)
+class Or_(Exp):
+	conds: list[Cond_]
+
+	def check(self, tags: TagSet) -> bool:
+		return any(cond.check(tags) for cond in self.conds)
+
+
+@dataclass(frozen=True, slots=True)
+class Not_(Exp):
+	cond: Cond_
+
+	def check(self, tags: TagSet) -> bool:
+		return not self.cond.check(tags)
+
+
+@dataclass(frozen=True, slots=True)
+class TagHas(Exp):
+	k: str
+
+	def check(self, tags: TagSet) -> bool:
+		return tags.has(self.k)
+
+
+@dataclass(frozen=True, slots=True)
+class TagMatch(Exp):
+	k: str
+	v: str | None
+
+	def check(self, tags: TagSet) -> bool:
+		return tags.match(self.k, self.v)
+
+
+@dataclass(frozen=True, slots=True)
+class TagRematch(Exp):
+	k: str
+	v: str | None
+
+	def check(self, tags: TagSet) -> bool:
+		return tags.rematch(self.k, self.v)
+
+
+@dataclass(frozen=True, slots=True)
+class TagContains(Exp):
+	k: str
+	v: str
+
+	def check(self, tags: TagSet) -> bool:
+		return tags.contains(self.k, self.v)

From d68d2a870ce2272f1ba63c685fa73b81bf65d292 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 15:04:36 -0500
Subject: [PATCH 04/15] feature: slap together a parser

---
 alpacloud/eztag/parser.py      | 135 +++++++++++++++++++++++
 alpacloud/eztag/parser_test.py | 193 +++++++++++++++++++++++++++++++++
 2 files changed, 328 insertions(+)
 create mode 100644 alpacloud/eztag/parser.py
 create mode 100644 alpacloud/eztag/parser_test.py

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
new file mode 100644
index 0000000..d8d1a6c
--- /dev/null
+++ b/alpacloud/eztag/parser.py
@@ -0,0 +1,135 @@
+from dataclasses import dataclass
+from typing import List, Optional, Union
+
+
+@dataclass
+class ParseState:
+	text: str
+	pos: int = 0
+
+	def peek(self) -> Optional[str]:
+		return self.text[self.pos] if self.pos < len(self.text) else None
+
+	def consume(self) -> Optional[str]:
+		if self.pos >= len(self.text):
+			return None
+		char = self.text[self.pos]
+		self.pos += 1
+		return char
+
+	def consume_while(self, predicate) -> str:
+		result = []
+		while self.peek() and predicate(self.peek()):
+			result.append(self.consume())
+		return ''.join(result)
+
+
+@dataclass
+class FunctionCall:
+	name: str
+	args: List[Union[str, 'FunctionCall']]
+
+
+class Parser:
+	def __init__(self, text: str):
+		self.state = ParseState(text.strip())
+
+	def parse(self) -> FunctionCall:
+		return self._parse_function_call()
+
+	def _parse_function_call(self) -> FunctionCall:
+		name = self._parse_identifier()
+		if not name:
+			raise ValueError("Expected function name")
+
+		if self.state.peek() != '(':
+			raise ValueError("Expected opening parenthesis")
+		self.state.consume()  # consume '('
+
+		args = self._parse_arguments()
+
+		if self.state.peek() != ')':
+			raise ValueError("Expected closing parenthesis")
+		self.state.consume()  # consume ')'
+
+		return FunctionCall(name, args)
+
+	def _parse_identifier(self) -> str:
+		return self.state.consume_while(lambda c: c.isalnum() or c == '_')
+
+	def _parse_arguments(self) -> List[Union[str, FunctionCall]]:
+		args = []
+		while True:
+			self.state.consume_while(str.isspace)
+
+			if self.state.peek() == ')':
+				break
+
+			arg = self._parse_argument()
+			args.append(arg)
+
+			self.state.consume_while(str.isspace)
+			if self.state.peek() == ',':
+				self.state.consume()
+			elif self.state.peek() != ')':
+				raise ValueError("Expected comma or closing parenthesis")
+
+		return args
+
+	def _parse_argument(self) -> Union[str, FunctionCall]:
+		self.state.consume_while(str.isspace)
+		
+		# Check if this argument is a function call
+		start_pos = self.state.pos
+		identifier = self._parse_identifier()
+		
+		if identifier and self.state.peek() == '(':
+			# It's a nested function call - parse it recursively
+			self.state.pos = start_pos  # Reset position
+			return self._parse_function_call()
+		else:
+			# It's a plain argument - reset and parse as string
+			self.state.pos = start_pos
+			return self._parse_plain_argument()
+
+	def _parse_plain_argument(self) -> str:
+		depth = 0
+		result = []
+		has_content = False
+
+		while self.state.peek():
+			char = self.state.peek()
+
+			if char == '(':
+				depth += 1
+			elif char == ')':
+				if depth == 0:
+					break
+				depth -= 1
+			elif char == ',' and depth == 0:
+				break
+			elif str.isspace(char) and depth == 0 and has_content:
+				# Check if there's more non-whitespace content after this space
+				# Save position to potentially restore
+				space_start = self.state.pos
+				self.state.consume_while(str.isspace)
+				
+				# If we hit a comma or closing paren, the spaces are trailing - OK
+				if self.state.peek() in (',', ')', None):
+					break
+				
+				# Otherwise, there's more content after spaces without a comma - ERROR
+				# But we need to check if it's another identifier (which would be invalid)
+				next_char = self.state.peek()
+				if next_char and (next_char.isalnum() or next_char == '_'):
+					raise ValueError("Expected comma or closing parenthesis")
+				
+				# Reset and continue consuming (for special chars in args)
+				self.state.pos = space_start
+			
+			if not str.isspace(char):
+				has_content = True
+			
+			result.append(self.state.consume())
+
+		return ''.join(result).strip()
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
new file mode 100644
index 0000000..c888f9a
--- /dev/null
+++ b/alpacloud/eztag/parser_test.py
@@ -0,0 +1,193 @@
+
+import pytest
+from alpacloud.eztag.parser import Parser, FunctionCall, ParseState
+
+
+class TestParseState:
+	"""Tests for ParseState helper class."""
+
+	def test_peek_at_beginning(self):
+		state = ParseState("hello")
+		assert state.peek() == 'h'
+		assert state.pos == 0  # peek doesn't advance
+
+	def test_peek_at_end(self):
+		state = ParseState("hi", pos=2)
+		assert state.peek() is None
+
+	def test_consume_advances_position(self):
+		state = ParseState("hello")
+		assert state.consume() == 'h'
+		assert state.pos == 1
+		assert state.consume() == 'e'
+		assert state.pos == 2
+
+	def test_consume_at_end_returns_none(self):
+		state = ParseState("a", pos=1)
+		assert state.consume() is None
+
+	def test_consume_while_with_predicate(self):
+		state = ParseState("abc123")
+		result = state.consume_while(str.isalpha)
+		assert result == "abc"
+		assert state.pos == 3
+
+	def test_consume_while_returns_empty_on_no_match(self):
+		state = ParseState("123")
+		result = state.consume_while(str.isalpha)
+		assert result == ""
+		assert state.pos == 0
+
+
+class TestParser:
+	"""Tests for Parser class."""
+
+	def test_simple_function_no_args(self):
+		parser = Parser("func()")
+		result = parser.parse()
+		assert result == FunctionCall("func", [])
+
+	def test_function_with_single_arg(self):
+		parser = Parser("func(arg1)")
+		result = parser.parse()
+		assert result == FunctionCall("func", ["arg1"])
+
+	def test_function_with_multiple_args(self):
+		parser = Parser("func(arg1, arg2, arg3)")
+		result = parser.parse()
+		assert result == FunctionCall("func", ["arg1", "arg2", "arg3"])
+
+	def test_function_with_numeric_args(self):
+		parser = Parser("add(123, 456)")
+		result = parser.parse()
+		assert result == FunctionCall("add", ["123", "456"])
+
+	def test_function_with_nested_function_call(self):
+		parser = Parser("func(nested(inner), arg2)")
+		result = parser.parse()
+		expected = FunctionCall("func", [
+			FunctionCall("nested", ["inner"]),
+			"arg2"
+		])
+		assert result == expected
+
+	def test_function_with_deeply_nested_function_calls(self):
+		parser = Parser("func(a(b(c)), d)")
+		result = parser.parse()
+		expected = FunctionCall("func", [
+			FunctionCall("a", [FunctionCall("b", ["c"])]),
+			"d"
+		])
+		assert result == expected
+
+	def test_function_with_spaces(self):
+		parser = Parser("func( arg1 , arg2 )")
+		result = parser.parse()
+		assert result == FunctionCall("func", ["arg1", "arg2"])
+
+	def test_function_with_leading_trailing_spaces(self):
+		parser = Parser("  func(arg)  ")
+		result = parser.parse()
+		assert result == FunctionCall("func", ["arg"])
+
+	def test_function_with_underscore_in_name(self):
+		parser = Parser("my_func(arg)")
+		result = parser.parse()
+		assert result == FunctionCall("my_func", ["arg"])
+
+	def test_function_with_numbers_in_name(self):
+		parser = Parser("func123(arg)")
+		result = parser.parse()
+		assert result == FunctionCall("func123", ["arg"])
+
+	def test_empty_string_raises_error(self):
+		parser = Parser("")
+		with pytest.raises(ValueError, match="Expected function name"):
+			parser.parse()
+
+	def test_missing_opening_paren_raises_error(self):
+		parser = Parser("func")
+		with pytest.raises(ValueError, match="Expected opening parenthesis"):
+			parser.parse()
+
+	def test_missing_closing_paren_raises_error(self):
+		parser = Parser("func(arg")
+		with pytest.raises(ValueError, match="Expected.*closing parenthesis"):
+			parser.parse()
+
+	def test_missing_comma_between_args_raises_error(self):
+		parser = Parser("func(arg1 arg2)")
+		with pytest.raises(ValueError, match="Expected comma or closing parenthesis"):
+			parser.parse()
+
+	def test_function_with_empty_arg_between_commas(self):
+		parser = Parser("func(arg1, , arg2)")
+		result = parser.parse()
+		# Empty string is a valid argument
+		assert result == FunctionCall("func", ["arg1", "", "arg2"])
+
+	def test_complex_nested_example(self):
+		parser = Parser("outer(inner1(a, b), inner2(c), d)")
+		result = parser.parse()
+		expected = FunctionCall("outer", [
+			FunctionCall("inner1", ["a", "b"]),
+			FunctionCall("inner2", ["c"]),
+			"d"
+		])
+		assert result == expected
+
+	def test_function_with_special_chars_in_args(self):
+		parser = Parser("func(arg-1, arg.2, arg@3)")
+		result = parser.parse()
+		assert result == FunctionCall("func", ["arg-1", "arg.2", "arg@3"])
+
+	def test_multiple_nested_levels(self):
+		parser = Parser("f1(f2(f3(f4())), x)")
+		result = parser.parse()
+		expected = FunctionCall("f1", [
+			FunctionCall("f2", [
+				FunctionCall("f3", [
+					FunctionCall("f4", [])
+				])
+			]),
+			"x"
+		])
+		assert result == expected
+
+	def test_nested_function_with_no_args(self):
+		parser = Parser("outer(inner())")
+		result = parser.parse()
+		expected = FunctionCall("outer", [FunctionCall("inner", [])])
+		assert result == expected
+
+	def test_multiple_nested_functions_as_args(self):
+		parser = Parser("func(a(), b(), c())")
+		result = parser.parse()
+		expected = FunctionCall("func", [
+			FunctionCall("a", []),
+			FunctionCall("b", []),
+			FunctionCall("c", [])
+		])
+		assert result == expected
+
+	def test_nested_with_mixed_args(self):
+		parser = Parser("outer(x, inner(y), z)")
+		result = parser.parse()
+		expected = FunctionCall("outer", [
+			"x",
+			FunctionCall("inner", ["y"]),
+			"z"
+		])
+		assert result == expected
+
+	def test_deeply_nested_with_multiple_args(self):
+		parser = Parser("a(b(c(d, e), f), g)")
+		result = parser.parse()
+		expected = FunctionCall("a", [
+			FunctionCall("b", [
+				FunctionCall("c", ["d", "e"]),
+				"f"
+			]),
+			"g"
+		])
+		assert result == expected
\ No newline at end of file

From c53bbe17845e7ec61a237d156716ffaeb640e8c5 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 16:21:44 -0500
Subject: [PATCH 05/15] feature: parse string literals and implement
 transformation into symbols

---
 alpacloud/eztag/parser.py      |  66 +++++++++++++-
 alpacloud/eztag/parser_test.py | 162 ++++++++++++++++++++++++++++-----
 2 files changed, 199 insertions(+), 29 deletions(-)

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index d8d1a6c..70fabc7 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -1,5 +1,8 @@
 from dataclasses import dataclass
-from typing import List, Optional, Union
+from typing import List, Optional, Union, Literal
+
+from alpacloud.eztag import logic
+from alpacloud.eztag.logic import Exp
 
 
 @dataclass
@@ -24,10 +27,20 @@ def consume_while(self, predicate) -> str:
 		return ''.join(result)
 
 
+@dataclass
+class StringLiteral:
+	value: str
+
+
 @dataclass
 class FunctionCall:
 	name: str
-	args: List[Union[str, 'FunctionCall']]
+	args: List[Union[str, StringLiteral, 'FunctionCall']]
+
+
+@dataclass
+class StringLiteral:
+	value: str
 
 
 class Parser:
@@ -57,7 +70,7 @@ def _parse_function_call(self) -> FunctionCall:
 	def _parse_identifier(self) -> str:
 		return self.state.consume_while(lambda c: c.isalnum() or c == '_')
 
-	def _parse_arguments(self) -> List[Union[str, FunctionCall]]:
+	def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
 		args = []
 		while True:
 			self.state.consume_while(str.isspace)
@@ -76,10 +89,10 @@ def _parse_arguments(self) -> List[Union[str, FunctionCall]]:
 
 		return args
 
-	def _parse_argument(self) -> Union[str, FunctionCall]:
+	def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
 		self.state.consume_while(str.isspace)
 		
-		# Check if this argument is a function call
+		# Check if this argument is a function call or string literal
 		start_pos = self.state.pos
 		identifier = self._parse_identifier()
 		
@@ -87,6 +100,14 @@ def _parse_argument(self) -> Union[str, FunctionCall]:
 			# It's a nested function call - parse it recursively
 			self.state.pos = start_pos  # Reset position
 			return self._parse_function_call()
+		elif identifier:
+			# It's a string literal (identifier not followed by '(')
+			# Check that we're at a valid stopping point
+			self.state.consume_while(str.isspace)
+			next_char = self.state.peek()
+			if next_char not in (',', ')', None):
+				raise ValueError("Expected comma or closing parenthesis")
+			return StringLiteral(identifier)
 		else:
 			# It's a plain argument - reset and parse as string
 			self.state.pos = start_pos
@@ -133,3 +154,38 @@ def _parse_plain_argument(self) -> str:
 			result.append(self.state.consume())
 
 		return ''.join(result).strip()
+
+
+@dataclass
+class TokenTransformation:
+	name: str
+	function: type[Exp]
+	args: list[str] | Literal["variadic"]
+
+@dataclass
+class TokenTransformer:
+	transformations: dict[str, TokenTransformation]
+
+	def transform(self, token: FunctionCall | StringLiteral) -> Exp | str:
+		if isinstance(token, StringLiteral):
+			return token.value
+
+		transformer = self.transformations[token.name]
+		if transformer.args == "variadic":
+			return transformer.function([self.transform(e) for e in token.args])
+		else:
+			raw_kwargs = dict(zip(transformer.args, token.args))
+			kwargs = {k: self.transform(v) for k, v in raw_kwargs.items()}
+			return transformer.function(**kwargs)
+
+transformer = TokenTransformer({
+	e.name:e for e in [
+		TokenTransformation("NOT", logic.Not_, ["cond"]),
+		TokenTransformation("AND", logic.And_, "variadic"),
+		TokenTransformation("OR", logic.Or_, "variadic"),
+		TokenTransformation("HAS", logic.TagHas, ["k"]),
+		TokenTransformation("MATCH", logic.TagMatch, ["k", "v"]),
+		TokenTransformation("RE", logic.TagRematch, ["k", "v"]),
+		TokenTransformation("CONTAINS", logic.TagContains, ["k", "v"]),
+	]
+})
\ No newline at end of file
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index c888f9a..c6550ea 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -1,6 +1,9 @@
+from dataclasses import dataclass
 
 import pytest
-from alpacloud.eztag.parser import Parser, FunctionCall, ParseState
+
+from alpacloud.eztag import logic
+from alpacloud.eztag.parser import Parser, FunctionCall, ParseState, StringLiteral, transformer, TokenTransformation, TokenTransformer
 
 
 class TestParseState:
@@ -39,6 +42,64 @@ def test_consume_while_returns_empty_on_no_match(self):
 		assert state.pos == 0
 
 
+class TestStringLiteral:
+	"""Tests for StringLiteral parsing."""
+
+	def test_single_string_literal(self):
+		parser = Parser("func(arg1)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [StringLiteral("arg1")])
+
+	def test_multiple_string_literals(self):
+		parser = Parser("func(arg1, arg2, arg3)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [
+			StringLiteral("arg1"),
+			StringLiteral("arg2"),
+			StringLiteral("arg3")
+		])
+
+	def test_string_literal_with_numbers(self):
+		parser = Parser("func(arg123)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [StringLiteral("arg123")])
+
+	def test_string_literal_with_underscore(self):
+		parser = Parser("func(my_arg)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [StringLiteral("my_arg")])
+
+	def test_string_literal_with_spaces(self):
+		parser = Parser("func( arg1 )")
+		result = parser.parse()
+		assert result == FunctionCall("func", [StringLiteral("arg1")])
+
+	def test_mixed_string_literals_and_function_calls(self):
+		parser = Parser("func(arg1, nested(), arg2)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [
+			StringLiteral("arg1"),
+			FunctionCall("nested", []),
+			StringLiteral("arg2")
+		])
+
+	def test_string_literal_in_nested_function(self):
+		parser = Parser("outer(inner(literal))")
+		result = parser.parse()
+		assert result == FunctionCall("outer", [
+			FunctionCall("inner", [StringLiteral("literal")])
+		])
+
+	def test_multiple_string_literals_nested(self):
+		parser = Parser("func(a, b(c, d), e)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [
+			StringLiteral("a"),
+			FunctionCall("b", [StringLiteral("c"), StringLiteral("d")]),
+			StringLiteral("e")
+		])
+
+
 class TestParser:
 	"""Tests for Parser class."""
 
@@ -50,24 +111,28 @@ def test_simple_function_no_args(self):
 	def test_function_with_single_arg(self):
 		parser = Parser("func(arg1)")
 		result = parser.parse()
-		assert result == FunctionCall("func", ["arg1"])
+		assert result == FunctionCall("func", [StringLiteral("arg1")])
 
 	def test_function_with_multiple_args(self):
 		parser = Parser("func(arg1, arg2, arg3)")
 		result = parser.parse()
-		assert result == FunctionCall("func", ["arg1", "arg2", "arg3"])
+		assert result == FunctionCall("func", [
+			StringLiteral("arg1"),
+			StringLiteral("arg2"),
+			StringLiteral("arg3")
+		])
 
 	def test_function_with_numeric_args(self):
 		parser = Parser("add(123, 456)")
 		result = parser.parse()
-		assert result == FunctionCall("add", ["123", "456"])
+		assert result == FunctionCall("add", [StringLiteral("123"), StringLiteral("456")])
 
 	def test_function_with_nested_function_call(self):
 		parser = Parser("func(nested(inner), arg2)")
 		result = parser.parse()
 		expected = FunctionCall("func", [
-			FunctionCall("nested", ["inner"]),
-			"arg2"
+			FunctionCall("nested", [StringLiteral("inner")]),
+			StringLiteral("arg2")
 		])
 		assert result == expected
 
@@ -75,30 +140,33 @@ def test_function_with_deeply_nested_function_calls(self):
 		parser = Parser("func(a(b(c)), d)")
 		result = parser.parse()
 		expected = FunctionCall("func", [
-			FunctionCall("a", [FunctionCall("b", ["c"])]),
-			"d"
+			FunctionCall("a", [FunctionCall("b", [StringLiteral("c")])]),
+			StringLiteral("d")
 		])
 		assert result == expected
 
 	def test_function_with_spaces(self):
 		parser = Parser("func( arg1 , arg2 )")
 		result = parser.parse()
-		assert result == FunctionCall("func", ["arg1", "arg2"])
+		assert result == FunctionCall("func", [
+			StringLiteral("arg1"),
+			StringLiteral("arg2")
+		])
 
 	def test_function_with_leading_trailing_spaces(self):
 		parser = Parser("  func(arg)  ")
 		result = parser.parse()
-		assert result == FunctionCall("func", ["arg"])
+		assert result == FunctionCall("func", [StringLiteral("arg")])
 
 	def test_function_with_underscore_in_name(self):
 		parser = Parser("my_func(arg)")
 		result = parser.parse()
-		assert result == FunctionCall("my_func", ["arg"])
+		assert result == FunctionCall("my_func", [StringLiteral("arg")])
 
 	def test_function_with_numbers_in_name(self):
 		parser = Parser("func123(arg)")
 		result = parser.parse()
-		assert result == FunctionCall("func123", ["arg"])
+		assert result == FunctionCall("func123", [StringLiteral("arg")])
 
 	def test_empty_string_raises_error(self):
 		parser = Parser("")
@@ -124,15 +192,19 @@ def test_function_with_empty_arg_between_commas(self):
 		parser = Parser("func(arg1, , arg2)")
 		result = parser.parse()
 		# Empty string is a valid argument
-		assert result == FunctionCall("func", ["arg1", "", "arg2"])
+		assert result == FunctionCall("func", [
+			StringLiteral("arg1"),
+			"",
+			StringLiteral("arg2")
+		])
 
 	def test_complex_nested_example(self):
 		parser = Parser("outer(inner1(a, b), inner2(c), d)")
 		result = parser.parse()
 		expected = FunctionCall("outer", [
-			FunctionCall("inner1", ["a", "b"]),
-			FunctionCall("inner2", ["c"]),
-			"d"
+			FunctionCall("inner1", [StringLiteral("a"), StringLiteral("b")]),
+			FunctionCall("inner2", [StringLiteral("c")]),
+			StringLiteral("d")
 		])
 		assert result == expected
 
@@ -150,7 +222,7 @@ def test_multiple_nested_levels(self):
 					FunctionCall("f4", [])
 				])
 			]),
-			"x"
+			StringLiteral("x")
 		])
 		assert result == expected
 
@@ -174,9 +246,9 @@ def test_nested_with_mixed_args(self):
 		parser = Parser("outer(x, inner(y), z)")
 		result = parser.parse()
 		expected = FunctionCall("outer", [
-			"x",
-			FunctionCall("inner", ["y"]),
-			"z"
+			StringLiteral("x"),
+			FunctionCall("inner", [StringLiteral("y")]),
+			StringLiteral("z")
 		])
 		assert result == expected
 
@@ -185,9 +257,51 @@ def test_deeply_nested_with_multiple_args(self):
 		result = parser.parse()
 		expected = FunctionCall("a", [
 			FunctionCall("b", [
-				FunctionCall("c", ["d", "e"]),
-				"f"
+				FunctionCall("c", [StringLiteral("d"), StringLiteral("e")]),
+				StringLiteral("f")
 			]),
-			"g"
+			StringLiteral("g")
+		])
+		assert result == expected
+
+	def test_string_literal_starts_with_number(self):
+		# Numbers at start mean it's not a valid identifier, so it's a plain arg
+		parser = Parser("func(123abc)")
+		result = parser.parse()
+		assert result == FunctionCall("func", [StringLiteral("123abc")])
+
+	def test_all_string_literals_in_complex_expr(self):
+		parser = Parser("and(or(a, b), not(c))")
+		result = parser.parse()
+		expected = FunctionCall("and", [
+			FunctionCall("or", [StringLiteral("a"), StringLiteral("b")]),
+			FunctionCall("not", [StringLiteral("c")])
 		])
-		assert result == expected
\ No newline at end of file
+		assert result == expected
+
+
+@dataclass
+class FakeItem:
+	k: str
+	v: str = "default"
+
+
+class TestTransformer:
+	"""Tests for Transformer class."""
+
+	def test_simple_function(self):
+		assert transformer.transform(FunctionCall("NOT", [StringLiteral("x")])) == logic.Not_("x")
+
+	def test_variadic_function(self):
+		assert transformer.transform(FunctionCall("AND", [StringLiteral("a"), StringLiteral("b"), StringLiteral("c")])) == logic.And_(["a", "b", "c"])
+
+	def test_multiple_args(self):
+		assert transformer.transform(FunctionCall("MATCH", [StringLiteral("k"), StringLiteral("v")])) == logic.TagMatch("k", "v")
+
+	def test_multiple_with_default(self):
+		assert TokenTransformer({
+			"TEST": TokenTransformation("TEST", FakeItem, ["k", "v"])
+		}).transform(FunctionCall("TEST", [StringLiteral("k")])) == FakeItem("k")
+
+	def test_recursive(self):
+		assert transformer.transform(FunctionCall("AND", [FunctionCall("NOT", [StringLiteral("x")])])) == logic.And_([logic.Not_("x")])
\ No newline at end of file

From fc799ff97a48e15d514cb1830ac18051034d3aa2 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 16:51:04 -0500
Subject: [PATCH 06/15] feature: add Regex literals and allow symbols in
 literals

---
 alpacloud/eztag/parser.py      | 20 +++++++++++++++++---
 alpacloud/eztag/parser_test.py | 14 ++++++++++++--
 2 files changed, 29 insertions(+), 5 deletions(-)

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 70fabc7..614dfbc 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -43,7 +43,13 @@ class StringLiteral:
 	value: str
 
 
+@dataclass
+class RegexLiteral:
+	value: str
+
 class Parser:
+	reserved_chars = set("(),/")
+
 	def __init__(self, text: str):
 		self.state = ParseState(text.strip())
 
@@ -68,7 +74,7 @@ def _parse_function_call(self) -> FunctionCall:
 		return FunctionCall(name, args)
 
 	def _parse_identifier(self) -> str:
-		return self.state.consume_while(lambda c: c.isalnum() or c == '_')
+		return self.state.consume_while(lambda c: c not in self.reserved_chars and not c.isspace())
 
 	def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
 		args = []
@@ -78,8 +84,10 @@ def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
 			if self.state.peek() == ')':
 				break
 
-			arg = self._parse_argument()
-			args.append(arg)
+			if self.state.peek() == '/':
+				args.append(self._parse_regex())
+			else:
+				args.append(self._parse_argument())
 
 			self.state.consume_while(str.isspace)
 			if self.state.peek() == ',':
@@ -89,6 +97,12 @@ def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
 
 		return args
 
+	def _parse_regex(self) -> RegexLiteral:
+		self.state.consume()
+		v = RegexLiteral(self.state.consume_while(lambda c: c != '/'))
+		self.state.consume()
+		return v
+
 	def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
 		self.state.consume_while(str.isspace)
 		
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index c6550ea..e4ecdc7 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -3,7 +3,7 @@
 import pytest
 
 from alpacloud.eztag import logic
-from alpacloud.eztag.parser import Parser, FunctionCall, ParseState, StringLiteral, transformer, TokenTransformation, TokenTransformer
+from alpacloud.eztag.parser import Parser, FunctionCall, ParseState, StringLiteral, transformer, TokenTransformation, TokenTransformer, RegexLiteral
 
 
 class TestParseState:
@@ -211,7 +211,7 @@ def test_complex_nested_example(self):
 	def test_function_with_special_chars_in_args(self):
 		parser = Parser("func(arg-1, arg.2, arg@3)")
 		result = parser.parse()
-		assert result == FunctionCall("func", ["arg-1", "arg.2", "arg@3"])
+		assert result == FunctionCall("func", [StringLiteral(value='arg-1'), StringLiteral(value='arg.2'), StringLiteral(value='arg@3')])
 
 	def test_multiple_nested_levels(self):
 		parser = Parser("f1(f2(f3(f4())), x)")
@@ -279,6 +279,16 @@ def test_all_string_literals_in_complex_expr(self):
 		])
 		assert result == expected
 
+	def test_regex_literal(self):
+		parser = Parser("match(k, /v/)")
+		result = parser.parse()
+		assert result == FunctionCall("match", [StringLiteral("k"), RegexLiteral("v")])
+
+	def test_regex_literal_with_nesting(self):
+		parser = Parser("match(k, /match(k, v)/)")
+		result = parser.parse()
+		assert result == FunctionCall("match", [StringLiteral("k"), RegexLiteral("match(k, v)")])
+
 
 @dataclass
 class FakeItem:

From 44e3d3ee3c1f67f2985b1433a06c02e4109ac5df Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 16:51:25 -0500
Subject: [PATCH 07/15] task: lint

---
 alpacloud/eztag/parser.py      |  78 +++++++++++++-----------
 alpacloud/eztag/parser_test.py | 105 +++++++--------------------------
 2 files changed, 64 insertions(+), 119 deletions(-)

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 614dfbc..59869a7 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -1,5 +1,5 @@
 from dataclasses import dataclass
-from typing import List, Optional, Union, Literal
+from typing import List, Literal, Optional, Union
 
 from alpacloud.eztag import logic
 from alpacloud.eztag.logic import Exp
@@ -24,7 +24,7 @@ def consume_while(self, predicate) -> str:
 		result = []
 		while self.peek() and predicate(self.peek()):
 			result.append(self.consume())
-		return ''.join(result)
+		return "".join(result)
 
 
 @dataclass
@@ -35,7 +35,7 @@ class StringLiteral:
 @dataclass
 class FunctionCall:
 	name: str
-	args: List[Union[str, StringLiteral, 'FunctionCall']]
+	args: List[Union[str, StringLiteral, "FunctionCall"]]
 
 
 @dataclass
@@ -47,6 +47,7 @@ class StringLiteral:
 class RegexLiteral:
 	value: str
 
+
 class Parser:
 	reserved_chars = set("(),/")
 
@@ -61,13 +62,13 @@ def _parse_function_call(self) -> FunctionCall:
 		if not name:
 			raise ValueError("Expected function name")
 
-		if self.state.peek() != '(':
+		if self.state.peek() != "(":
 			raise ValueError("Expected opening parenthesis")
 		self.state.consume()  # consume '('
 
 		args = self._parse_arguments()
 
-		if self.state.peek() != ')':
+		if self.state.peek() != ")":
 			raise ValueError("Expected closing parenthesis")
 		self.state.consume()  # consume ')'
 
@@ -81,36 +82,36 @@ def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
 		while True:
 			self.state.consume_while(str.isspace)
 
-			if self.state.peek() == ')':
+			if self.state.peek() == ")":
 				break
 
-			if self.state.peek() == '/':
+			if self.state.peek() == "/":
 				args.append(self._parse_regex())
 			else:
 				args.append(self._parse_argument())
 
 			self.state.consume_while(str.isspace)
-			if self.state.peek() == ',':
+			if self.state.peek() == ",":
 				self.state.consume()
-			elif self.state.peek() != ')':
+			elif self.state.peek() != ")":
 				raise ValueError("Expected comma or closing parenthesis")
 
 		return args
 
 	def _parse_regex(self) -> RegexLiteral:
 		self.state.consume()
-		v = RegexLiteral(self.state.consume_while(lambda c: c != '/'))
+		v = RegexLiteral(self.state.consume_while(lambda c: c != "/"))
 		self.state.consume()
 		return v
 
 	def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
 		self.state.consume_while(str.isspace)
-		
+
 		# Check if this argument is a function call or string literal
 		start_pos = self.state.pos
 		identifier = self._parse_identifier()
-		
-		if identifier and self.state.peek() == '(':
+
+		if identifier and self.state.peek() == "(":
 			# It's a nested function call - parse it recursively
 			self.state.pos = start_pos  # Reset position
 			return self._parse_function_call()
@@ -119,7 +120,7 @@ def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
 			# Check that we're at a valid stopping point
 			self.state.consume_while(str.isspace)
 			next_char = self.state.peek()
-			if next_char not in (',', ')', None):
+			if next_char not in (",", ")", None):
 				raise ValueError("Expected comma or closing parenthesis")
 			return StringLiteral(identifier)
 		else:
@@ -135,39 +136,39 @@ def _parse_plain_argument(self) -> str:
 		while self.state.peek():
 			char = self.state.peek()
 
-			if char == '(':
+			if char == "(":
 				depth += 1
-			elif char == ')':
+			elif char == ")":
 				if depth == 0:
 					break
 				depth -= 1
-			elif char == ',' and depth == 0:
+			elif char == "," and depth == 0:
 				break
 			elif str.isspace(char) and depth == 0 and has_content:
 				# Check if there's more non-whitespace content after this space
 				# Save position to potentially restore
 				space_start = self.state.pos
 				self.state.consume_while(str.isspace)
-				
+
 				# If we hit a comma or closing paren, the spaces are trailing - OK
-				if self.state.peek() in (',', ')', None):
+				if self.state.peek() in (",", ")", None):
 					break
-				
+
 				# Otherwise, there's more content after spaces without a comma - ERROR
 				# But we need to check if it's another identifier (which would be invalid)
 				next_char = self.state.peek()
-				if next_char and (next_char.isalnum() or next_char == '_'):
+				if next_char and (next_char.isalnum() or next_char == "_"):
 					raise ValueError("Expected comma or closing parenthesis")
-				
+
 				# Reset and continue consuming (for special chars in args)
 				self.state.pos = space_start
-			
+
 			if not str.isspace(char):
 				has_content = True
-			
+
 			result.append(self.state.consume())
 
-		return ''.join(result).strip()
+		return "".join(result).strip()
 
 
 @dataclass
@@ -176,6 +177,7 @@ class TokenTransformation:
 	function: type[Exp]
 	args: list[str] | Literal["variadic"]
 
+
 @dataclass
 class TokenTransformer:
 	transformations: dict[str, TokenTransformation]
@@ -192,14 +194,18 @@ def transform(self, token: FunctionCall | StringLiteral) -> Exp | str:
 			kwargs = {k: self.transform(v) for k, v in raw_kwargs.items()}
 			return transformer.function(**kwargs)
 
-transformer = TokenTransformer({
-	e.name:e for e in [
-		TokenTransformation("NOT", logic.Not_, ["cond"]),
-		TokenTransformation("AND", logic.And_, "variadic"),
-		TokenTransformation("OR", logic.Or_, "variadic"),
-		TokenTransformation("HAS", logic.TagHas, ["k"]),
-		TokenTransformation("MATCH", logic.TagMatch, ["k", "v"]),
-		TokenTransformation("RE", logic.TagRematch, ["k", "v"]),
-		TokenTransformation("CONTAINS", logic.TagContains, ["k", "v"]),
-	]
-})
\ No newline at end of file
+
+transformer = TokenTransformer(
+	{
+		e.name: e
+		for e in [
+			TokenTransformation("NOT", logic.Not_, ["cond"]),
+			TokenTransformation("AND", logic.And_, "variadic"),
+			TokenTransformation("OR", logic.Or_, "variadic"),
+			TokenTransformation("HAS", logic.TagHas, ["k"]),
+			TokenTransformation("MATCH", logic.TagMatch, ["k", "v"]),
+			TokenTransformation("RE", logic.TagRematch, ["k", "v"]),
+			TokenTransformation("CONTAINS", logic.TagContains, ["k", "v"]),
+		]
+	}
+)
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index e4ecdc7..c92888d 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -3,7 +3,7 @@
 import pytest
 
 from alpacloud.eztag import logic
-from alpacloud.eztag.parser import Parser, FunctionCall, ParseState, StringLiteral, transformer, TokenTransformation, TokenTransformer, RegexLiteral
+from alpacloud.eztag.parser import FunctionCall, Parser, ParseState, RegexLiteral, StringLiteral, TokenTransformation, TokenTransformer, transformer
 
 
 class TestParseState:
@@ -11,7 +11,7 @@ class TestParseState:
 
 	def test_peek_at_beginning(self):
 		state = ParseState("hello")
-		assert state.peek() == 'h'
+		assert state.peek() == "h"
 		assert state.pos == 0  # peek doesn't advance
 
 	def test_peek_at_end(self):
@@ -20,9 +20,9 @@ def test_peek_at_end(self):
 
 	def test_consume_advances_position(self):
 		state = ParseState("hello")
-		assert state.consume() == 'h'
+		assert state.consume() == "h"
 		assert state.pos == 1
-		assert state.consume() == 'e'
+		assert state.consume() == "e"
 		assert state.pos == 2
 
 	def test_consume_at_end_returns_none(self):
@@ -53,11 +53,7 @@ def test_single_string_literal(self):
 	def test_multiple_string_literals(self):
 		parser = Parser("func(arg1, arg2, arg3)")
 		result = parser.parse()
-		assert result == FunctionCall("func", [
-			StringLiteral("arg1"),
-			StringLiteral("arg2"),
-			StringLiteral("arg3")
-		])
+		assert result == FunctionCall("func", [StringLiteral("arg1"), StringLiteral("arg2"), StringLiteral("arg3")])
 
 	def test_string_literal_with_numbers(self):
 		parser = Parser("func(arg123)")
@@ -77,27 +73,17 @@ def test_string_literal_with_spaces(self):
 	def test_mixed_string_literals_and_function_calls(self):
 		parser = Parser("func(arg1, nested(), arg2)")
 		result = parser.parse()
-		assert result == FunctionCall("func", [
-			StringLiteral("arg1"),
-			FunctionCall("nested", []),
-			StringLiteral("arg2")
-		])
+		assert result == FunctionCall("func", [StringLiteral("arg1"), FunctionCall("nested", []), StringLiteral("arg2")])
 
 	def test_string_literal_in_nested_function(self):
 		parser = Parser("outer(inner(literal))")
 		result = parser.parse()
-		assert result == FunctionCall("outer", [
-			FunctionCall("inner", [StringLiteral("literal")])
-		])
+		assert result == FunctionCall("outer", [FunctionCall("inner", [StringLiteral("literal")])])
 
 	def test_multiple_string_literals_nested(self):
 		parser = Parser("func(a, b(c, d), e)")
 		result = parser.parse()
-		assert result == FunctionCall("func", [
-			StringLiteral("a"),
-			FunctionCall("b", [StringLiteral("c"), StringLiteral("d")]),
-			StringLiteral("e")
-		])
+		assert result == FunctionCall("func", [StringLiteral("a"), FunctionCall("b", [StringLiteral("c"), StringLiteral("d")]), StringLiteral("e")])
 
 
 class TestParser:
@@ -116,11 +102,7 @@ def test_function_with_single_arg(self):
 	def test_function_with_multiple_args(self):
 		parser = Parser("func(arg1, arg2, arg3)")
 		result = parser.parse()
-		assert result == FunctionCall("func", [
-			StringLiteral("arg1"),
-			StringLiteral("arg2"),
-			StringLiteral("arg3")
-		])
+		assert result == FunctionCall("func", [StringLiteral("arg1"), StringLiteral("arg2"), StringLiteral("arg3")])
 
 	def test_function_with_numeric_args(self):
 		parser = Parser("add(123, 456)")
@@ -130,28 +112,19 @@ def test_function_with_numeric_args(self):
 	def test_function_with_nested_function_call(self):
 		parser = Parser("func(nested(inner), arg2)")
 		result = parser.parse()
-		expected = FunctionCall("func", [
-			FunctionCall("nested", [StringLiteral("inner")]),
-			StringLiteral("arg2")
-		])
+		expected = FunctionCall("func", [FunctionCall("nested", [StringLiteral("inner")]), StringLiteral("arg2")])
 		assert result == expected
 
 	def test_function_with_deeply_nested_function_calls(self):
 		parser = Parser("func(a(b(c)), d)")
 		result = parser.parse()
-		expected = FunctionCall("func", [
-			FunctionCall("a", [FunctionCall("b", [StringLiteral("c")])]),
-			StringLiteral("d")
-		])
+		expected = FunctionCall("func", [FunctionCall("a", [FunctionCall("b", [StringLiteral("c")])]), StringLiteral("d")])
 		assert result == expected
 
 	def test_function_with_spaces(self):
 		parser = Parser("func( arg1 , arg2 )")
 		result = parser.parse()
-		assert result == FunctionCall("func", [
-			StringLiteral("arg1"),
-			StringLiteral("arg2")
-		])
+		assert result == FunctionCall("func", [StringLiteral("arg1"), StringLiteral("arg2")])
 
 	def test_function_with_leading_trailing_spaces(self):
 		parser = Parser("  func(arg)  ")
@@ -192,38 +165,23 @@ def test_function_with_empty_arg_between_commas(self):
 		parser = Parser("func(arg1, , arg2)")
 		result = parser.parse()
 		# Empty string is a valid argument
-		assert result == FunctionCall("func", [
-			StringLiteral("arg1"),
-			"",
-			StringLiteral("arg2")
-		])
+		assert result == FunctionCall("func", [StringLiteral("arg1"), "", StringLiteral("arg2")])
 
 	def test_complex_nested_example(self):
 		parser = Parser("outer(inner1(a, b), inner2(c), d)")
 		result = parser.parse()
-		expected = FunctionCall("outer", [
-			FunctionCall("inner1", [StringLiteral("a"), StringLiteral("b")]),
-			FunctionCall("inner2", [StringLiteral("c")]),
-			StringLiteral("d")
-		])
+		expected = FunctionCall("outer", [FunctionCall("inner1", [StringLiteral("a"), StringLiteral("b")]), FunctionCall("inner2", [StringLiteral("c")]), StringLiteral("d")])
 		assert result == expected
 
 	def test_function_with_special_chars_in_args(self):
 		parser = Parser("func(arg-1, arg.2, arg@3)")
 		result = parser.parse()
-		assert result == FunctionCall("func", [StringLiteral(value='arg-1'), StringLiteral(value='arg.2'), StringLiteral(value='arg@3')])
+		assert result == FunctionCall("func", [StringLiteral(value="arg-1"), StringLiteral(value="arg.2"), StringLiteral(value="arg@3")])
 
 	def test_multiple_nested_levels(self):
 		parser = Parser("f1(f2(f3(f4())), x)")
 		result = parser.parse()
-		expected = FunctionCall("f1", [
-			FunctionCall("f2", [
-				FunctionCall("f3", [
-					FunctionCall("f4", [])
-				])
-			]),
-			StringLiteral("x")
-		])
+		expected = FunctionCall("f1", [FunctionCall("f2", [FunctionCall("f3", [FunctionCall("f4", [])])]), StringLiteral("x")])
 		assert result == expected
 
 	def test_nested_function_with_no_args(self):
@@ -235,33 +193,19 @@ def test_nested_function_with_no_args(self):
 	def test_multiple_nested_functions_as_args(self):
 		parser = Parser("func(a(), b(), c())")
 		result = parser.parse()
-		expected = FunctionCall("func", [
-			FunctionCall("a", []),
-			FunctionCall("b", []),
-			FunctionCall("c", [])
-		])
+		expected = FunctionCall("func", [FunctionCall("a", []), FunctionCall("b", []), FunctionCall("c", [])])
 		assert result == expected
 
 	def test_nested_with_mixed_args(self):
 		parser = Parser("outer(x, inner(y), z)")
 		result = parser.parse()
-		expected = FunctionCall("outer", [
-			StringLiteral("x"),
-			FunctionCall("inner", [StringLiteral("y")]),
-			StringLiteral("z")
-		])
+		expected = FunctionCall("outer", [StringLiteral("x"), FunctionCall("inner", [StringLiteral("y")]), StringLiteral("z")])
 		assert result == expected
 
 	def test_deeply_nested_with_multiple_args(self):
 		parser = Parser("a(b(c(d, e), f), g)")
 		result = parser.parse()
-		expected = FunctionCall("a", [
-			FunctionCall("b", [
-				FunctionCall("c", [StringLiteral("d"), StringLiteral("e")]),
-				StringLiteral("f")
-			]),
-			StringLiteral("g")
-		])
+		expected = FunctionCall("a", [FunctionCall("b", [FunctionCall("c", [StringLiteral("d"), StringLiteral("e")]), StringLiteral("f")]), StringLiteral("g")])
 		assert result == expected
 
 	def test_string_literal_starts_with_number(self):
@@ -273,10 +217,7 @@ def test_string_literal_starts_with_number(self):
 	def test_all_string_literals_in_complex_expr(self):
 		parser = Parser("and(or(a, b), not(c))")
 		result = parser.parse()
-		expected = FunctionCall("and", [
-			FunctionCall("or", [StringLiteral("a"), StringLiteral("b")]),
-			FunctionCall("not", [StringLiteral("c")])
-		])
+		expected = FunctionCall("and", [FunctionCall("or", [StringLiteral("a"), StringLiteral("b")]), FunctionCall("not", [StringLiteral("c")])])
 		assert result == expected
 
 	def test_regex_literal(self):
@@ -309,9 +250,7 @@ def test_multiple_args(self):
 		assert transformer.transform(FunctionCall("MATCH", [StringLiteral("k"), StringLiteral("v")])) == logic.TagMatch("k", "v")
 
 	def test_multiple_with_default(self):
-		assert TokenTransformer({
-			"TEST": TokenTransformation("TEST", FakeItem, ["k", "v"])
-		}).transform(FunctionCall("TEST", [StringLiteral("k")])) == FakeItem("k")
+		assert TokenTransformer({"TEST": TokenTransformation("TEST", FakeItem, ["k", "v"])}).transform(FunctionCall("TEST", [StringLiteral("k")])) == FakeItem("k")
 
 	def test_recursive(self):
-		assert transformer.transform(FunctionCall("AND", [FunctionCall("NOT", [StringLiteral("x")])])) == logic.And_([logic.Not_("x")])
\ No newline at end of file
+		assert transformer.transform(FunctionCall("AND", [FunctionCall("NOT", [StringLiteral("x")])])) == logic.And_([logic.Not_("x")])

From 135490d3a7c015fea58a41d4d303b5aa10d8f147 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 16 Nov 2025 17:31:03 -0500
Subject: [PATCH 08/15] task: typecheck and cull dead branch

---
 alpacloud/eztag/logic.py       |   2 +-
 alpacloud/eztag/multidict.py   |  17 +++---
 alpacloud/eztag/parser.py      | 103 +++++++++++----------------------
 alpacloud/eztag/parser_test.py |   5 +-
 4 files changed, 46 insertions(+), 81 deletions(-)

diff --git a/alpacloud/eztag/logic.py b/alpacloud/eztag/logic.py
index ee32910..9b67956 100644
--- a/alpacloud/eztag/logic.py
+++ b/alpacloud/eztag/logic.py
@@ -65,7 +65,7 @@ def check(self, tags: TagSet) -> bool:
 @dataclass(frozen=True, slots=True)
 class TagRematch(Exp):
 	k: str
-	v: str | None
+	v: str
 
 	def check(self, tags: TagSet) -> bool:
 		return tags.rematch(self.k, self.v)
diff --git a/alpacloud/eztag/multidict.py b/alpacloud/eztag/multidict.py
index 30f5d1b..7af3087 100644
--- a/alpacloud/eztag/multidict.py
+++ b/alpacloud/eztag/multidict.py
@@ -1,10 +1,12 @@
-from typing import Iterable, TypeAlias
+from __future__ import annotations
+
+from typing import Iterable, TypeAlias, TypeGuard
 
 K: TypeAlias = str
 V: TypeAlias = str | None
 
 
-def _is_collection(obj):
+def _is_collection(obj) -> TypeGuard[Iterable]:
 	"""
 	Checks if an object is an iterable collection, excluding strings and bytes.
 	"""
@@ -21,28 +23,29 @@ def __init__(self):
 		self.d: dict[K, set[V]] = {}
 
 	@classmethod
-	def from_dict(cls, d: dict[K, V]):
+	def from_dict(cls, d: dict[K, V]) -> MultiDict:
 		md = cls()
 		for k, v in d.items():
 			md[k] = {v}
 		return md
 
 	@classmethod
-	def create(cls, d: dict[K, Iterable[V] | V]):
+	def create(cls, d: dict[K, Iterable[V] | V]) -> MultiDict:
 		md = cls()
 		for k, vs in d.items():
+			n: set[V]
 			if not _is_collection(vs):
-				n = {vs}
+				n = {vs}  # type: ignore # idk typeguard
 			else:
 				n = set(vs)
 			md.d[k] = n
 		return md
 
-	def __getitem__(self, key):
+	def __getitem__(self, key) -> set[V]:
 		return self.d[key]
 
 	def __setitem__(self, key, value):
 		self.d.setdefault(key, set()).add(value)
 
-	def __contains__(self, key):
+	def __contains__(self, key) -> bool:
 		return key in self.d
diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 59869a7..2cf3f01 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -1,5 +1,6 @@
+import abc
 from dataclasses import dataclass
-from typing import List, Literal, Optional, Union
+from typing import List, Literal, Optional
 
 from alpacloud.eztag import logic
 from alpacloud.eztag.logic import Exp
@@ -23,28 +24,29 @@ def consume(self) -> Optional[str]:
 	def consume_while(self, predicate) -> str:
 		result = []
 		while self.peek() and predicate(self.peek()):
-			result.append(self.consume())
+			next_result = self.consume()
+			if next_result is not None:
+				result.append(next_result)
 		return "".join(result)
 
 
-@dataclass
-class StringLiteral:
-	value: str
+class ASTNode(abc.ABC):
+	pass
 
 
 @dataclass
-class FunctionCall:
-	name: str
-	args: List[Union[str, StringLiteral, "FunctionCall"]]
+class StringLiteral(ASTNode):
+	value: str
 
 
 @dataclass
-class StringLiteral:
-	value: str
+class FunctionCall(ASTNode):
+	name: str
+	args: List[ASTNode]
 
 
 @dataclass
-class RegexLiteral:
+class RegexLiteral(ASTNode):
 	value: str
 
 
@@ -77,8 +79,8 @@ def _parse_function_call(self) -> FunctionCall:
 	def _parse_identifier(self) -> str:
 		return self.state.consume_while(lambda c: c not in self.reserved_chars and not c.isspace())
 
-	def _parse_arguments(self) -> List[Union[str, StringLiteral, FunctionCall]]:
-		args = []
+	def _parse_arguments(self) -> List[ASTNode]:
+		args: List[ASTNode] = []
 		while True:
 			self.state.consume_while(str.isspace)
 
@@ -104,7 +106,7 @@ def _parse_regex(self) -> RegexLiteral:
 		self.state.consume()
 		return v
 
-	def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
+	def _parse_argument(self) -> ASTNode:
 		self.state.consume_while(str.isspace)
 
 		# Check if this argument is a function call or string literal
@@ -124,51 +126,7 @@ def _parse_argument(self) -> Union[str, StringLiteral, FunctionCall]:
 				raise ValueError("Expected comma or closing parenthesis")
 			return StringLiteral(identifier)
 		else:
-			# It's a plain argument - reset and parse as string
-			self.state.pos = start_pos
-			return self._parse_plain_argument()
-
-	def _parse_plain_argument(self) -> str:
-		depth = 0
-		result = []
-		has_content = False
-
-		while self.state.peek():
-			char = self.state.peek()
-
-			if char == "(":
-				depth += 1
-			elif char == ")":
-				if depth == 0:
-					break
-				depth -= 1
-			elif char == "," and depth == 0:
-				break
-			elif str.isspace(char) and depth == 0 and has_content:
-				# Check if there's more non-whitespace content after this space
-				# Save position to potentially restore
-				space_start = self.state.pos
-				self.state.consume_while(str.isspace)
-
-				# If we hit a comma or closing paren, the spaces are trailing - OK
-				if self.state.peek() in (",", ")", None):
-					break
-
-				# Otherwise, there's more content after spaces without a comma - ERROR
-				# But we need to check if it's another identifier (which would be invalid)
-				next_char = self.state.peek()
-				if next_char and (next_char.isalnum() or next_char == "_"):
-					raise ValueError("Expected comma or closing parenthesis")
-
-				# Reset and continue consuming (for special chars in args)
-				self.state.pos = space_start
-
-			if not str.isspace(char):
-				has_content = True
-
-			result.append(self.state.consume())
-
-		return "".join(result).strip()
+			raise ValueError("Expected identifier")
 
 
 @dataclass
@@ -182,17 +140,22 @@ class TokenTransformation:
 class TokenTransformer:
 	transformations: dict[str, TokenTransformation]
 
-	def transform(self, token: FunctionCall | StringLiteral) -> Exp | str:
-		if isinstance(token, StringLiteral):
-			return token.value
-
-		transformer = self.transformations[token.name]
-		if transformer.args == "variadic":
-			return transformer.function([self.transform(e) for e in token.args])
-		else:
-			raw_kwargs = dict(zip(transformer.args, token.args))
-			kwargs = {k: self.transform(v) for k, v in raw_kwargs.items()}
-			return transformer.function(**kwargs)
+	def transform(self, token: ASTNode) -> Exp | str:
+		match token:
+			case StringLiteral():
+				return token.value
+			case RegexLiteral():
+				return token.value
+			case FunctionCall():
+				transformer = self.transformations[token.name]
+				if transformer.args == "variadic":
+					return transformer.function([self.transform(e) for e in token.args])  # type: ignore # the typesafety is done by the TokenTransformation
+				else:
+					raw_kwargs = dict(zip(transformer.args, token.args))
+					kwargs = {k: self.transform(v) for k, v in raw_kwargs.items()}
+					return transformer.function(**kwargs)
+			case _:
+				raise ValueError(f"Unexpected token: {token} of type {type(token)}")
 
 
 transformer = TokenTransformer(
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index c92888d..259b8e1 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -163,9 +163,8 @@ def test_missing_comma_between_args_raises_error(self):
 
 	def test_function_with_empty_arg_between_commas(self):
 		parser = Parser("func(arg1, , arg2)")
-		result = parser.parse()
-		# Empty string is a valid argument
-		assert result == FunctionCall("func", [StringLiteral("arg1"), "", StringLiteral("arg2")])
+		with pytest.raises(ValueError, match="Expected identifier"):
+			parser.parse()
 
 	def test_complex_nested_example(self):
 		parser = Parser("outer(inner1(a, b), inner2(c), d)")

From b52209c0e3896d6929c70ce9c2ec5d18a2e00d59 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 23 Nov 2025 23:33:02 -0500
Subject: [PATCH 09/15] task: rename Exp -> Expr

---
 alpacloud/eztag/logic.py  | 18 +++++++++---------
 alpacloud/eztag/parser.py |  8 +++++---
 2 files changed, 14 insertions(+), 12 deletions(-)

diff --git a/alpacloud/eztag/logic.py b/alpacloud/eztag/logic.py
index 9b67956..6f4a6c4 100644
--- a/alpacloud/eztag/logic.py
+++ b/alpacloud/eztag/logic.py
@@ -5,7 +5,7 @@
 from alpacloud.eztag.tag import TagSet
 
 
-class Exp(ABC):
+class Expr(ABC):
 	"""A predicate"""
 
 	def check(self, tags: TagSet) -> bool:
@@ -14,7 +14,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class Cond_(Exp):
+class Cond_(Expr):
 	f: Callable[[TagSet], bool]
 
 	def check(self, tags: TagSet) -> bool:
@@ -22,7 +22,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class And_(Exp):
+class And_(Expr):
 	conds: list[Cond_]
 
 	def check(self, tags: TagSet) -> bool:
@@ -30,7 +30,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class Or_(Exp):
+class Or_(Expr):
 	conds: list[Cond_]
 
 	def check(self, tags: TagSet) -> bool:
@@ -38,7 +38,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class Not_(Exp):
+class Not_(Expr):
 	cond: Cond_
 
 	def check(self, tags: TagSet) -> bool:
@@ -46,7 +46,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class TagHas(Exp):
+class TagHas(Expr):
 	k: str
 
 	def check(self, tags: TagSet) -> bool:
@@ -54,7 +54,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class TagMatch(Exp):
+class TagMatch(Expr):
 	k: str
 	v: str | None
 
@@ -63,7 +63,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class TagRematch(Exp):
+class TagRematch(Expr):
 	k: str
 	v: str
 
@@ -72,7 +72,7 @@ def check(self, tags: TagSet) -> bool:
 
 
 @dataclass(frozen=True, slots=True)
-class TagContains(Exp):
+class TagContains(Expr):
 	k: str
 	v: str
 
diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 2cf3f01..ecdbce2 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -1,9 +1,11 @@
+from __future__ import annotations
+
 import abc
 from dataclasses import dataclass
 from typing import List, Literal, Optional
 
 from alpacloud.eztag import logic
-from alpacloud.eztag.logic import Exp
+from alpacloud.eztag.logic import Expr
 
 
 @dataclass
@@ -132,7 +134,7 @@ def _parse_argument(self) -> ASTNode:
 @dataclass
 class TokenTransformation:
 	name: str
-	function: type[Exp]
+	function: type[Expr]
 	args: list[str] | Literal["variadic"]
 
 
@@ -140,7 +142,7 @@ class TokenTransformation:
 class TokenTransformer:
 	transformations: dict[str, TokenTransformation]
 
-	def transform(self, token: ASTNode) -> Exp | str:
+	def transform(self, token: ASTNode) -> Expr | str:
 		match token:
 			case StringLiteral():
 				return token.value

From 13aead88f663db41f908c182e8831841d1c145ab Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 23 Nov 2025 23:33:26 -0500
Subject: [PATCH 10/15] feature: add selector for externally-tagged items

---
 alpacloud/eztag/selector.py | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)
 create mode 100644 alpacloud/eztag/selector.py

diff --git a/alpacloud/eztag/selector.py b/alpacloud/eztag/selector.py
new file mode 100644
index 0000000..3f78f79
--- /dev/null
+++ b/alpacloud/eztag/selector.py
@@ -0,0 +1,18 @@
+from typing import TypeVar
+
+from alpacloud.eztag.logic import Expr
+from alpacloud.eztag.tag import TagSet
+
+Data = TypeVar("Data")
+
+class Selector:
+	"""Select items based on their tags"""
+
+	def __init__(self, items: list[tuple[TagSet, Data]]):
+		self.items = items
+
+	def select(self, expr: Expr) -> list[Data]:
+		return [e[1] for e in self.select_with_tags(expr)]
+
+	def select_with_tags(self, expr: Expr) -> list[tuple[TagSet, Data]]:
+		return [e for e in self.items if expr.check(e[0])]

From c3132dbc211ce9a2ddf410ac2d808e51054cb66d Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 23 Nov 2025 23:33:58 -0500
Subject: [PATCH 11/15] feature: allow token case-insensitivity

---
 alpacloud/eztag/parser.py | 14 +++++++++++---
 1 file changed, 11 insertions(+), 3 deletions(-)

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index ecdbce2..653bd03 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -138,9 +138,13 @@ class TokenTransformation:
 	args: list[str] | Literal["variadic"]
 
 
-@dataclass
 class TokenTransformer:
-	transformations: dict[str, TokenTransformation]
+	def __init__(self, transformations: dict[str, TokenTransformation], case_sensitive_tokens: bool = False):
+		self.case_sensitive_tokens = case_sensitive_tokens
+		if case_sensitive_tokens:
+			self.transformations = transformations
+		else:
+			self.transformations = {k.lower(): v for k, v in transformations.items()}
 
 	def transform(self, token: ASTNode) -> Expr | str:
 		match token:
@@ -149,7 +153,11 @@ def transform(self, token: ASTNode) -> Expr | str:
 			case RegexLiteral():
 				return token.value
 			case FunctionCall():
-				transformer = self.transformations[token.name]
+				if self.case_sensitive_tokens:
+					transformer = self.transformations[token.name]
+				else:
+					transformer = self.transformations[token.name.lower()]
+
 				if transformer.args == "variadic":
 					return transformer.function([self.transform(e) for e in token.args])  # type: ignore # the typesafety is done by the TokenTransformation
 				else:

From c4858309687a517c072c876d6df4b18f830029f8 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Sun, 23 Nov 2025 23:34:59 -0500
Subject: [PATCH 12/15] doc: add readme

---
 alpacloud/eztag/parser.py      | 11 +++++
 alpacloud/eztag/parser_test.py | 10 +++-
 alpacloud/eztag/readme.md      | 85 +++++++++++++++++++++++++++++++++-
 alpacloud/eztag/tag.py         | 10 +++-
 4 files changed, 113 insertions(+), 3 deletions(-)

diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 653bd03..8d0bccc 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -133,6 +133,14 @@ def _parse_argument(self) -> ASTNode:
 
 @dataclass
 class TokenTransformation:
+	"""
+	Associates the name of a function with the Expr implementing functionality.
+
+	The `args` field associates positional arguments in the raw filter expression with the function's keyword arguments.
+	For example, MATCH takes a key (k) and a value (v), so `args = ["k", "v"]`.
+	For functions that take a variable number of arguments, such as AND and OR, `args = "variadic"`.
+	"""
+
 	name: str
 	function: type[Expr]
 	args: list[str] | Literal["variadic"]
@@ -167,6 +175,9 @@ def transform(self, token: ASTNode) -> Expr | str:
 			case _:
 				raise ValueError(f"Unexpected token: {token} of type {type(token)}")
 
+	def extended(self, more_transformers: dict[str, TokenTransformation]) -> TokenTransformer:
+		return TokenTransformer(dict(**self.transformations, **more_transformers), self.case_sensitive_tokens)
+
 
 transformer = TokenTransformer(
 	{
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index 259b8e1..977d59d 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -3,6 +3,7 @@
 import pytest
 
 from alpacloud.eztag import logic
+from alpacloud.eztag.logic import TagRematch, TagMatch, And_
 from alpacloud.eztag.parser import FunctionCall, Parser, ParseState, RegexLiteral, StringLiteral, TokenTransformation, TokenTransformer, transformer
 
 
@@ -229,7 +230,6 @@ def test_regex_literal_with_nesting(self):
 		result = parser.parse()
 		assert result == FunctionCall("match", [StringLiteral("k"), RegexLiteral("match(k, v)")])
 
-
 @dataclass
 class FakeItem:
 	k: str
@@ -253,3 +253,11 @@ def test_multiple_with_default(self):
 
 	def test_recursive(self):
 		assert transformer.transform(FunctionCall("AND", [FunctionCall("NOT", [StringLiteral("x")])])) == logic.And_([logic.Not_("x")])
+
+
+class TestIntegration:
+	def test_example(self):
+
+		filter = "and(match(env, prd), re(name, /grafana.*/))"
+		result = transformer.transform(Parser(filter).parse())
+		assert result == And_(conds=[TagMatch(k='env', v='prd'), TagRematch(k='name', v='grafana.*')])
\ No newline at end of file
diff --git a/alpacloud/eztag/readme.md b/alpacloud/eztag/readme.md
index 916107b..b9f0c54 100644
--- a/alpacloud/eztag/readme.md
+++ b/alpacloud/eztag/readme.md
@@ -1,7 +1,16 @@
 # alpacloud.eztag
 
-`eztag` helps you easily filter things by tags. For example:
+`eztag` helps you easily filter things by tags.
+
+## Usage
+
+### Filtering in code
+
+You can directly invoke the filters as functions. For example:
+
 ```python
+from alpacloud.eztag.tag import TagSet
+
 @dataclass
 class Snippet:
     name: str
@@ -21,3 +30,77 @@ There are several filter functions available:
 - match : check if a TagSet has a key with a value
 - rematch : check if a TagSet has a key with a value that matches a regex
 - contains : check if a TagSet has a key whose value contains a substring
+
+### Filtering external data
+
+If your objects don't have tags, you can associate tag data with them using `Selector`:
+
+```python
+from alpacloud.eztag.logic import TagMatch
+from alpacloud.eztag.selector import Selector
+from alpacloud.eztag.tag import TagSet
+
+tasks = Selector([
+    (TagSet.from_dict({"env":"prd", "dangerous": "true"}), task0),
+    (TagSet.from_dict({"env":"stg", "dangerous": "false"}), task1),
+])
+
+dangerous_tasks = tasks.select(TagMatch("dangerous", "true"))
+```
+
+### Filtering from the CLI
+
+`eztag` allows you to input filters in a simple language from the CLI. You can build this filtering into your own tools.
+
+
+```python
+import click
+
+from alpacloud.eztag.parser import Parser, transformer
+from alpacloud.eztag.selector import Selector
+
+tagged_tasks = Selector(...)
+
+@click.command()
+@click.argument("filter")
+def cli(filter):
+    expr = transformer.transform(Parser(filter).parse())
+    selected_tasks = tagged_tasks.select(expr)
+
+    for task in selected_tasks:
+        task.run()
+```
+
+Then you can invoke it like this:
+```shell
+task-run --filter 'and(match(env, prd), re(name, /cert.*/)'
+```
+
+## Advanced usage
+
+### Adding custom filters or operators
+
+1. Implement your filter as a subclass of `alpacloud.eztag.logic.Expr`
+
+   ```python
+   from dataclasses import dataclass
+   from alpacloud.eztag.logic import Expr
+   
+   @dataclass(frozen=True)
+   class Shard(Expr):
+       """Run tasks with this shard identifier"""
+       shard: int
+   
+       def check(self, tags) -> bool:
+           return tags.contains("shard", str(self.shard))
+   ```
+   
+2. Register your filter in the `transformer` dictionary:
+
+   ```python
+   from alpacloud.eztag.transformer import transformer, TokenTransformer, TokenTransformation
+   
+   my_transformer = transformer.extended({
+       "SHARD": TokenTransformation("SHARD", Shard, args=["shard"]),
+   })
+   ```
diff --git a/alpacloud/eztag/tag.py b/alpacloud/eztag/tag.py
index 2bc0112..24898d2 100644
--- a/alpacloud/eztag/tag.py
+++ b/alpacloud/eztag/tag.py
@@ -3,7 +3,7 @@
 import re
 from dataclasses import dataclass
 
-from alpacloud.eztag.multidict import MultiDict
+from alpacloud.eztag.multidict import MultiDict, V, K
 
 
 @dataclass
@@ -12,6 +12,14 @@ class TagSet:
 
 	ts: MultiDict
 
+	@classmethod
+	def from_dict(cls, d: dict[K, V]) -> TagSet:
+		return cls(MultiDict.from_dict(d))
+
+	@classmethod
+	def create(cls, d: dict[K, V | list[V]]) -> TagSet:
+		return cls(MultiDict.create(d))
+
 	def has(self, k: str) -> bool:
 		"""Check if the key exists in the tagset"""
 		return k in self.ts

From 56a8008c85368e7ebb28524b11ed21a1a66cf615 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Mon, 24 Nov 2025 00:18:42 -0500
Subject: [PATCH 13/15] doc: more comments and document grammar

---
 alpacloud/eztag/logic.py       | 18 ++++++++++++
 alpacloud/eztag/multidict.py   |  6 ++++
 alpacloud/eztag/parser.py      | 50 ++++++++++++++++++++++++++++------
 alpacloud/eztag/parser_test.py | 20 ++++++++++----
 alpacloud/eztag/readme.md      | 21 ++++++++++++++
 alpacloud/eztag/selector.py    |  5 ++++
 alpacloud/eztag/tag.py         |  6 +++-
 alpacloud/eztag/tag_test.py    |  2 ++
 8 files changed, 113 insertions(+), 15 deletions(-)

diff --git a/alpacloud/eztag/logic.py b/alpacloud/eztag/logic.py
index 6f4a6c4..6df4df0 100644
--- a/alpacloud/eztag/logic.py
+++ b/alpacloud/eztag/logic.py
@@ -1,3 +1,5 @@
+"""Expressions for tag filtering"""
+
 from abc import ABC
 from dataclasses import dataclass
 from typing import Callable
@@ -15,6 +17,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class Cond_(Expr):
+	"""A condition that checks if a tag set satisfies a predicate"""
+
 	f: Callable[[TagSet], bool]
 
 	def check(self, tags: TagSet) -> bool:
@@ -23,6 +27,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class And_(Expr):
+	"""AND of multiple conditions"""
+
 	conds: list[Cond_]
 
 	def check(self, tags: TagSet) -> bool:
@@ -31,6 +37,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class Or_(Expr):
+	"""OR of multiple conditions"""
+
 	conds: list[Cond_]
 
 	def check(self, tags: TagSet) -> bool:
@@ -39,6 +47,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class Not_(Expr):
+	"""Negation of a condition"""
+
 	cond: Cond_
 
 	def check(self, tags: TagSet) -> bool:
@@ -47,6 +57,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class TagHas(Expr):
+	"""Check if a tag set has a given tag, with any value"""
+
 	k: str
 
 	def check(self, tags: TagSet) -> bool:
@@ -55,6 +67,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class TagMatch(Expr):
+	"""Check if a tag set has a given tag with a specific value"""
+
 	k: str
 	v: str | None
 
@@ -64,6 +78,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class TagRematch(Expr):
+	"""Check if a tag set has a given tag with value matching a regular expression"""
+
 	k: str
 	v: str
 
@@ -73,6 +89,8 @@ def check(self, tags: TagSet) -> bool:
 
 @dataclass(frozen=True, slots=True)
 class TagContains(Expr):
+	"""Check if a tag set has a given tag with a specific value"""
+
 	k: str
 	v: str
 
diff --git a/alpacloud/eztag/multidict.py b/alpacloud/eztag/multidict.py
index 7af3087..0344d0c 100644
--- a/alpacloud/eztag/multidict.py
+++ b/alpacloud/eztag/multidict.py
@@ -1,3 +1,5 @@
+"""Generic multidict implementation. A multidict allows multiple values for the same key."""
+
 from __future__ import annotations
 
 from typing import Iterable, TypeAlias, TypeGuard
@@ -24,6 +26,7 @@ def __init__(self):
 
 	@classmethod
 	def from_dict(cls, d: dict[K, V]) -> MultiDict:
+		"""Create a multidict from a dict of key-value pairs"""
 		md = cls()
 		for k, v in d.items():
 			md[k] = {v}
@@ -31,6 +34,9 @@ def from_dict(cls, d: dict[K, V]) -> MultiDict:
 
 	@classmethod
 	def create(cls, d: dict[K, Iterable[V] | V]) -> MultiDict:
+		"""
+		Create a multidict from a dict of key-value pairs or key-list of values pairs
+		"""
 		md = cls()
 		for k, vs in d.items():
 			n: set[V]
diff --git a/alpacloud/eztag/parser.py b/alpacloud/eztag/parser.py
index 8d0bccc..78b8dae 100644
--- a/alpacloud/eztag/parser.py
+++ b/alpacloud/eztag/parser.py
@@ -1,3 +1,13 @@
+"""
+Parse filter expressions into predicates for filtering tags.
+
+The grammar is as follows:
+regex_literal := "/" regex "/"
+string_literal := any characters except "(),/" and spaces
+expr := identifier(expr [, expr])* | regex_literal | string_literal
+identifier := "and" | "or" | "not" | "has" | "match" | "re" | "contains"
+"""
+
 from __future__ import annotations
 
 import abc
@@ -10,13 +20,17 @@
 
 @dataclass
 class ParseState:
+	"""State of the parser"""
+
 	text: str
 	pos: int = 0
 
 	def peek(self) -> Optional[str]:
+		"""Look at the next character in the input text without consuming it"""
 		return self.text[self.pos] if self.pos < len(self.text) else None
 
 	def consume(self) -> Optional[str]:
+		"""Consume the next character from the input text"""
 		if self.pos >= len(self.text):
 			return None
 		char = self.text[self.pos]
@@ -24,6 +38,9 @@ def consume(self) -> Optional[str]:
 		return char
 
 	def consume_while(self, predicate) -> str:
+		"""
+		Consume characters from the input text while the predicate is True
+		"""
 		result = []
 		while self.peek() and predicate(self.peek()):
 			next_result = self.consume()
@@ -33,32 +50,43 @@ def consume_while(self, predicate) -> str:
 
 
 class ASTNode(abc.ABC):
-	pass
+	"""Abstract base class for AST nodes"""
 
 
 @dataclass
 class StringLiteral(ASTNode):
+	"""AST node representing a string literal"""
+
 	value: str
 
 
 @dataclass
 class FunctionCall(ASTNode):
+	"""AST node representing a function call. Everything that isn't a literal is a function call."""
+
 	name: str
-	args: List[ASTNode]
+	args: list[ASTNode]
 
 
 @dataclass
 class RegexLiteral(ASTNode):
+	"""AST node representing a regex literal"""
+
 	value: str
 
 
 class Parser:
+	"""Parses a filter expression into an AST"""
+
 	reserved_chars = set("(),/")
 
 	def __init__(self, text: str):
 		self.state = ParseState(text.strip())
 
 	def parse(self) -> FunctionCall:
+		"""
+		Parse a filter expression into an AST
+		"""
 		return self._parse_function_call()
 
 	def _parse_function_call(self) -> FunctionCall:
@@ -147,6 +175,8 @@ class TokenTransformation:
 
 
 class TokenTransformer:
+	"""Transforms AST nodes into Exprs"""
+
 	def __init__(self, transformations: dict[str, TokenTransformation], case_sensitive_tokens: bool = False):
 		self.case_sensitive_tokens = case_sensitive_tokens
 		if case_sensitive_tokens:
@@ -155,6 +185,7 @@ def __init__(self, transformations: dict[str, TokenTransformation], case_sensiti
 			self.transformations = {k.lower(): v for k, v in transformations.items()}
 
 	def transform(self, token: ASTNode) -> Expr | str:
+		"""Transform an AST node into an Expr"""
 		match token:
 			case StringLiteral():
 				return token.value
@@ -162,21 +193,22 @@ def transform(self, token: ASTNode) -> Expr | str:
 				return token.value
 			case FunctionCall():
 				if self.case_sensitive_tokens:
-					transformer = self.transformations[token.name]
+					transformation = self.transformations[token.name]
 				else:
-					transformer = self.transformations[token.name.lower()]
+					transformation = self.transformations[token.name.lower()]
 
-				if transformer.args == "variadic":
-					return transformer.function([self.transform(e) for e in token.args])  # type: ignore # the typesafety is done by the TokenTransformation
+				if transformation.args == "variadic":
+					return transformation.function([self.transform(e) for e in token.args])  # type: ignore # the typesafety is done by the TokenTransformation
 				else:
-					raw_kwargs = dict(zip(transformer.args, token.args))
+					raw_kwargs = dict(zip(transformation.args, token.args))
 					kwargs = {k: self.transform(v) for k, v in raw_kwargs.items()}
-					return transformer.function(**kwargs)
+					return transformation.function(**kwargs)
 			case _:
 				raise ValueError(f"Unexpected token: {token} of type {type(token)}")
 
 	def extended(self, more_transformers: dict[str, TokenTransformation]) -> TokenTransformer:
-		return TokenTransformer(dict(**self.transformations, **more_transformers), self.case_sensitive_tokens)
+		"""Make a new TokenTransformer with additional transformations. New transformations take precedence over existing ones."""
+		return TokenTransformer({**self.transformations, **more_transformers}, self.case_sensitive_tokens)
 
 
 transformer = TokenTransformer(
diff --git a/alpacloud/eztag/parser_test.py b/alpacloud/eztag/parser_test.py
index 977d59d..836aa70 100644
--- a/alpacloud/eztag/parser_test.py
+++ b/alpacloud/eztag/parser_test.py
@@ -1,9 +1,11 @@
+"""Tests for parser module."""
+
 from dataclasses import dataclass
 
 import pytest
 
 from alpacloud.eztag import logic
-from alpacloud.eztag.logic import TagRematch, TagMatch, And_
+from alpacloud.eztag.logic import And_, TagMatch, TagRematch
 from alpacloud.eztag.parser import FunctionCall, Parser, ParseState, RegexLiteral, StringLiteral, TokenTransformation, TokenTransformer, transformer
 
 
@@ -167,6 +169,10 @@ def test_function_with_empty_arg_between_commas(self):
 		with pytest.raises(ValueError, match="Expected identifier"):
 			parser.parse()
 
+
+class TestParserNested:
+	"""Tests for Parser class with nested function calls."""
+
 	def test_complex_nested_example(self):
 		parser = Parser("outer(inner1(a, b), inner2(c), d)")
 		result = parser.parse()
@@ -230,8 +236,11 @@ def test_regex_literal_with_nesting(self):
 		result = parser.parse()
 		assert result == FunctionCall("match", [StringLiteral("k"), RegexLiteral("match(k, v)")])
 
+
 @dataclass
 class FakeItem:
+	"""Fake item for testing transformer."""
+
 	k: str
 	v: str = "default"
 
@@ -256,8 +265,9 @@ def test_recursive(self):
 
 
 class TestIntegration:
-	def test_example(self):
+	"""Integration tests for Parser and Transformer."""
 
-		filter = "and(match(env, prd), re(name, /grafana.*/))"
-		result = transformer.transform(Parser(filter).parse())
-		assert result == And_(conds=[TagMatch(k='env', v='prd'), TagRematch(k='name', v='grafana.*')])
\ No newline at end of file
+	def test_example(self):
+		filter_str = "and(match(env, prd), re(name, /grafana.*/))"
+		result = transformer.transform(Parser(filter_str).parse())
+		assert result == And_(conds=[TagMatch(k="env", v="prd"), TagRematch(k="name", v="grafana.*")])
diff --git a/alpacloud/eztag/readme.md b/alpacloud/eztag/readme.md
index b9f0c54..ced4306 100644
--- a/alpacloud/eztag/readme.md
+++ b/alpacloud/eztag/readme.md
@@ -76,10 +76,31 @@ Then you can invoke it like this:
 task-run --filter 'and(match(env, prd), re(name, /cert.*/)'
 ```
 
+## CLI filter usage
+
+Filter syntax is:
+```
+regex_literal := "/" regex "/"
+string_literal := any characters except "(),/" and spaces
+expr := identifier(expr [, expr])* | regex_literal | string_literal
+identifier := "and" | "or" | "not" | "has" | "match" | "re" | "contains"
+```
+
+the operations are:
+- `and` : logical AND
+- `or` : logical OR
+- `not` : logical NOT
+- `has` : check if a tag has a key
+- `match` : check if a tag has a key with a value
+- `re` : check if a tag has a key with a value that matches a regex
+- `contains` : check if a tag has a key whose value contains a substring
+
 ## Advanced usage
 
 ### Adding custom filters or operators
 
+You can add your own filters or operators to streamline your usecase. For example, if you shard your tasks, you can add a filter to run only on a specific shard and then filter with `AND(MATCH(env, prd), SHARD(5))` for example.
+
 1. Implement your filter as a subclass of `alpacloud.eztag.logic.Expr`
 
    ```python
diff --git a/alpacloud/eztag/selector.py b/alpacloud/eztag/selector.py
index 3f78f79..64c475d 100644
--- a/alpacloud/eztag/selector.py
+++ b/alpacloud/eztag/selector.py
@@ -1,3 +1,5 @@
+"""Selector items based on their tags. Useful for when tags are external to the data."""
+
 from typing import TypeVar
 
 from alpacloud.eztag.logic import Expr
@@ -5,6 +7,7 @@
 
 Data = TypeVar("Data")
 
+
 class Selector:
 	"""Select items based on their tags"""
 
@@ -12,7 +15,9 @@ def __init__(self, items: list[tuple[TagSet, Data]]):
 		self.items = items
 
 	def select(self, expr: Expr) -> list[Data]:
+		"""Select items based on a predicate"""
 		return [e[1] for e in self.select_with_tags(expr)]
 
 	def select_with_tags(self, expr: Expr) -> list[tuple[TagSet, Data]]:
+		"""Select items based on a predicate, returning their tags as well"""
 		return [e for e in self.items if expr.check(e[0])]
diff --git a/alpacloud/eztag/tag.py b/alpacloud/eztag/tag.py
index 24898d2..e7af026 100644
--- a/alpacloud/eztag/tag.py
+++ b/alpacloud/eztag/tag.py
@@ -1,9 +1,11 @@
+"""TagSet implementation, includes operations on finding tags matching criteria"""
+
 from __future__ import annotations
 
 import re
 from dataclasses import dataclass
 
-from alpacloud.eztag.multidict import MultiDict, V, K
+from alpacloud.eztag.multidict import K, MultiDict, V
 
 
 @dataclass
@@ -14,10 +16,12 @@ class TagSet:
 
 	@classmethod
 	def from_dict(cls, d: dict[K, V]) -> TagSet:
+		"""Create a tagset from a dict of key-value pairs"""
 		return cls(MultiDict.from_dict(d))
 
 	@classmethod
 	def create(cls, d: dict[K, V | list[V]]) -> TagSet:
+		"""Create a tagset from a dict of key-value pairs or key-list of values pairs"""
 		return cls(MultiDict.create(d))
 
 	def has(self, k: str) -> bool:
diff --git a/alpacloud/eztag/tag_test.py b/alpacloud/eztag/tag_test.py
index f7383aa..e0f5669 100644
--- a/alpacloud/eztag/tag_test.py
+++ b/alpacloud/eztag/tag_test.py
@@ -1,3 +1,5 @@
+"""Tests for TagSet class"""
+
 from __future__ import annotations
 
 import re

From 44eccdeeccec300f93c3a76ae79da86ba06269e6 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Mon, 24 Nov 2025 00:22:20 -0500
Subject: [PATCH 14/15] task: typecheck

---
 alpacloud/eztag/selector.py | 4 ++--
 alpacloud/eztag/tag.py      | 3 ++-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/alpacloud/eztag/selector.py b/alpacloud/eztag/selector.py
index 64c475d..bcce757 100644
--- a/alpacloud/eztag/selector.py
+++ b/alpacloud/eztag/selector.py
@@ -1,6 +1,6 @@
 """Selector items based on their tags. Useful for when tags are external to the data."""
 
-from typing import TypeVar
+from typing import Generic, TypeVar
 
 from alpacloud.eztag.logic import Expr
 from alpacloud.eztag.tag import TagSet
@@ -8,7 +8,7 @@
 Data = TypeVar("Data")
 
 
-class Selector:
+class Selector(Generic[Data]):
 	"""Select items based on their tags"""
 
 	def __init__(self, items: list[tuple[TagSet, Data]]):
diff --git a/alpacloud/eztag/tag.py b/alpacloud/eztag/tag.py
index e7af026..fc7072b 100644
--- a/alpacloud/eztag/tag.py
+++ b/alpacloud/eztag/tag.py
@@ -4,6 +4,7 @@
 
 import re
 from dataclasses import dataclass
+from typing import Iterable
 
 from alpacloud.eztag.multidict import K, MultiDict, V
 
@@ -20,7 +21,7 @@ def from_dict(cls, d: dict[K, V]) -> TagSet:
 		return cls(MultiDict.from_dict(d))
 
 	@classmethod
-	def create(cls, d: dict[K, V | list[V]]) -> TagSet:
+	def create(cls, d: dict[K, Iterable[V] | V]) -> TagSet:
 		"""Create a tagset from a dict of key-value pairs or key-list of values pairs"""
 		return cls(MultiDict.create(d))
 

From f76ad209d6d502f20b3a132f8716792fa09713d9 Mon Sep 17 00:00:00 2001
From: Daniel Goldman <danielgoldman4@gmail.com>
Date: Mon, 24 Nov 2025 00:43:19 -0500
Subject: [PATCH 15/15] task: fix build dependency

---
 alpacloud/eztag/BUILD | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/alpacloud/eztag/BUILD b/alpacloud/eztag/BUILD
index f371540..2aabcbb 100644
--- a/alpacloud/eztag/BUILD
+++ b/alpacloud/eztag/BUILD
@@ -12,7 +12,7 @@ python_test_utils(
 python_distribution(
 	name="alpacloud.eztag",
 	repositories=["@alpacloud.eztag"],
-	dependencies=[":lens"],
+	dependencies=[":eztag"],
 	long_description_path="alpacloud/eztag/readme.md",
 	provides=python_artifact(
 		name="alpacloud_eztag",