gemini-code-assist[bot] commented on code in PR #216: URL: https://github.com/apache/tvm-ffi/pull/216#discussion_r2485031693
##########
tests/python/utils/test_filelock.py:
##########
@@ -0,0 +1,163 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+"""Tests for the FileLock utility."""
+
+import subprocess
+import sys
+import tempfile
+from pathlib import Path
+
+import pytest
+from tvm_ffi.utils.lockfile import FileLock
+
+
+def test_basic_lock_acquire_and_release() -> None:
+    """Test basic lock acquisition and release."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        lock_path = Path(temp_dir) / "test.lock"
+        lock = FileLock(str(lock_path))
+
+        # Test acquire
+        assert lock.acquire() is True
+        assert lock._file_descriptor is not None
+
+        # Test release
+        lock.release()
+        assert lock._file_descriptor is None
+
+
+def test_context_manager() -> None:
+    """Test FileLock as a context manager."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        lock_path = Path(temp_dir) / "test.lock"
+
+        with FileLock(str(lock_path)) as lock:
+            assert lock._file_descriptor is not None
+            # Lock should be acquired
+            assert lock_path.exists()
+
+        # Lock should be released after exiting context
+        # Note: file may still exist but should be unlocked
+
+
+def test_multiple_acquire_attempts() -> None:
+    """Test multiple acquire attempts on the same lock instance."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        lock_path = Path(temp_dir) / "test.lock"
+        lock = FileLock(str(lock_path))
+
+        # First acquire should succeed
+        assert lock.acquire() is True
+
+        # Second acquire on same instance should fail
+        # (can't acquire same lock twice)
+        assert lock.acquire() is False
+
+        lock.release()
+
+
+def test_exception_in_context_manager() -> None:
+    """Test that lock is properly released even when exception occurs."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        lock_path = Path(temp_dir) / "test.lock"
+
+        # Test that exception is propagated and lock is released
+        with pytest.raises(ValueError, match="test exception"):
+            with FileLock(str(lock_path)) as lock:
+                assert lock._file_descriptor is not None
+                raise ValueError("test exception")
+
+        # Lock should be released, so we can acquire it again
+        lock2 = FileLock(str(lock_path))
+        assert lock2.acquire() is True
+        lock2.release()
+
+
+concurrent_worker_script = '''
+import sys
+import time
+import random
+from pathlib import Path
+from tvm_ffi.utils.lockfile import FileLock
+
+def worker(worker_id, lock_path, counter_file):
+    """Worker function that tries to acquire lock and increment counter."""
+    try:
+        with FileLock(lock_path):
+            # Critical section - read, increment, write counter
+            with open(counter_file, 'r') as f:
+                current_value = int(f.read().strip())
+
+            time.sleep(random.uniform(0.01, 0.1))  # Simulate some work
+
+            with open(counter_file, 'w') as f:
+                f.write(str(current_value + 1))
+
+        print(f"Worker {worker_id}: success")
+        return 0
+    except Exception as e:
+        print(f"Worker {worker_id}: error: {e}")
+        return 1
+
+if __name__ == "__main__":
+    worker_id = int(sys.argv[1])
+    lock_path = sys.argv[2]
+    counter_file = sys.argv[3]
+    sys.exit(worker(worker_id, lock_path, counter_file))
+'''

Review Comment:
   Embedding a significant script as a multi-line string can harm maintainability. It's hard to read, and tools like linters and syntax highlighters won't work on it. For better code organization and easier debugging, consider moving this worker script to a separate helper file (e.g., `tests/python/utils/filelock_worker.py`) and invoking that from the test.
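   For illustration only, this is roughly what the test-side launcher could look like if the worker logic lived in a sibling helper. The `filelock_worker.py` file name follows the suggestion above, and the `launch_worker` wrapper and `WORKER_SCRIPT` constant are assumptions for this sketch, not code from the PR:

```python
# Sketch: launch a separate helper script instead of writing a temp file.
# Assumes a hypothetical tests/python/utils/filelock_worker.py that keeps the
# same CLI as the embedded script: <worker_id> <lock_path> <counter_file>.
import subprocess
import sys
from pathlib import Path

WORKER_SCRIPT = Path(__file__).parent / "filelock_worker.py"  # assumed helper location


def launch_worker(worker_id: int, lock_path: Path, counter_file: Path) -> subprocess.Popen:
    """Start one worker process that contends for the file lock."""
    return subprocess.Popen(
        [sys.executable, str(WORKER_SCRIPT), str(worker_id), str(lock_path), str(counter_file)]
    )
```

   This keeps the worker under normal linting and lets it be debugged directly with `python filelock_worker.py <worker_id> <lock_path> <counter_file>`.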
##########
tests/python/utils/test_filelock.py:
##########
@@ -0,0 +1,163 @@
+def test_concurrent_access() -> None:
+    """Test concurrent access from multiple processes."""
+    with tempfile.TemporaryDirectory() as temp_dir:
+        lock_path = Path(temp_dir) / "test.lock"
+        counter_file = Path(temp_dir) / "counter.txt"
+
+        # Initialize counter file
+        counter_file.write_text("0")
+
+        # Create worker script content
+
+        # Write worker script to a temporary file
+        worker_script_path = Path(temp_dir) / "worker.py"
+        worker_script_path.write_text(concurrent_worker_script)
+
+        # Run multiple worker processes concurrently
+        num_workers = 16
+        processes = []
+        for i in range(num_workers):
+            p = subprocess.Popen(
+                [sys.executable, str(worker_script_path), str(i), str(lock_path), str(counter_file)]
+            )
+            processes.append(p)
+
+        # Wait for all processes to complete
+        for p in processes:
+            p.wait(timeout=num_workers)  # wait for `num_workers` seconds at most

Review Comment:
   The timeout for `p.wait()` is set to `num_workers` seconds. This is a bit arbitrary and might be too short or too long depending on system load. A more robust approach is to calculate the timeout based on the test's parameters. For instance, since each worker sleeps for up to 0.1s and performs some I/O, a timeout like `num_workers * 0.5` would provide a generous buffer while being more principled.

```suggestion
            p.wait(timeout=num_workers * 0.5)  # wait for a calculated timeout
```
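   Another option, if a flat multiplier feels too coarse, is a single wall-clock deadline shared by all workers, so the total time budget of the test is explicit. This is only a sketch; the `wait_all` helper and the 10-second default budget are assumptions, not part of the PR:

```python
import subprocess
import time


def wait_all(processes: list[subprocess.Popen], overall_timeout: float = 10.0) -> None:
    """Wait for every process against one shared wall-clock deadline."""
    deadline = time.monotonic() + overall_timeout
    for p in processes:
        remaining = max(0.0, deadline - time.monotonic())
        # Raises subprocess.TimeoutExpired if the shared budget runs out.
        p.wait(timeout=remaining)
```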
##########
python/tvm_ffi/utils/lockfile.py:
##########
@@ -97,10 +105,17 @@ def acquire(self) -> bool:
     def blocking_acquire(self, timeout: float | None = None, poll_interval: float = 0.1) -> bool:
         """Wait until an exclusive lock can be acquired, with an optional timeout.
 
-        Args:
-            timeout (float): The maximum time to wait for the lock in seconds.
-                A value of None means wait indefinitely.
-            poll_interval (float): The time to wait between lock attempts in seconds.
+        Parameters
+        ----------
+        timeout: float:
+            The maximum time to wait for the lock in seconds. A value of None means wait indefinitely.
+        poll_interval: float
+            The time to wait between lock attempts in seconds.
+
+        Returns
+        -------
+        ret: bool
+            True if the lock was acquired, False otherwise.
         """

Review Comment:
   The updated docstring is an improvement, but it has some issues:

   * **Inconsistency**: It states the method returns a `bool` (`True` on success, `False` otherwise), but the implementation actually raises a `TimeoutError` if the lock isn't acquired within the timeout period. It never returns `False`. Since the context manager (`__enter__`) relies on this exception, the docstring should be updated to document the `TimeoutError`.
   * **Typo**: There's a typo in the `timeout` parameter description: `timeout: float:`.
   * **Re-acquisition Bug**: A more critical issue is that `blocking_acquire` will now loop until timeout if called on an instance that already holds the lock. This is because `acquire()` returns `False`, and the method doesn't distinguish this case from a lock held by another process. This should be fixed by adding a check at the start of `blocking_acquire`'s body (e.g., `if self._file_descriptor is not None: raise RuntimeError(...)`). Since the method body is not in the diff, I can't suggest the code change, but it's a critical fix to consider.

   Here is a suggested update for the docstring to make it accurate.

```python
    """Wait until an exclusive lock can be acquired, with an optional timeout.

    Parameters
    ----------
    timeout: float, optional
        The maximum time to wait for the lock in seconds. A value of None means wait indefinitely.
    poll_interval: float
        The time to wait between lock attempts in seconds.

    Returns
    -------
    ret: bool
        True if the lock was acquired.

    Raises
    ------
    TimeoutError
        If the lock is not acquired within the timeout period.
    """
```
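   To make the re-acquisition point concrete, the guard could look like the sketch below. Only `acquire()` and `_file_descriptor` are taken from this PR; the polling loop is a stand-in for whatever the real method body does, since it is not visible in the diff:

```python
import time


def blocking_acquire(self, timeout: float | None = None, poll_interval: float = 0.1) -> bool:
    """Sketch of the guard discussed above, shaped like the FileLock method; not the actual implementation."""
    if self._file_descriptor is not None:
        # Without this check, re-acquiring from the same instance would spin until TimeoutError.
        raise RuntimeError("FileLock is already held by this instance")
    deadline = None if timeout is None else time.monotonic() + timeout
    while not self.acquire():
        if deadline is not None and time.monotonic() >= deadline:
            raise TimeoutError(f"Could not acquire lock within {timeout} seconds")
        time.sleep(poll_interval)
    return True
```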
+"""Tests for the FileLock utility.""" + +import subprocess +import sys +import tempfile +from pathlib import Path + +import pytest +from tvm_ffi.utils.lockfile import FileLock + + +def test_basic_lock_acquire_and_release() -> None: + """Test basic lock acquisition and release.""" + with tempfile.TemporaryDirectory() as temp_dir: + lock_path = Path(temp_dir) / "test.lock" + lock = FileLock(str(lock_path)) + + # Test acquire + assert lock.acquire() is True + assert lock._file_descriptor is not None + + # Test release + lock.release() + assert lock._file_descriptor is None + + +def test_context_manager() -> None: + """Test FileLock as a context manager.""" + with tempfile.TemporaryDirectory() as temp_dir: + lock_path = Path(temp_dir) / "test.lock" + + with FileLock(str(lock_path)) as lock: + assert lock._file_descriptor is not None + # Lock should be acquired + assert lock_path.exists() + + # Lock should be released after exiting context + # Note: file may still exist but should be unlocked + + +def test_multiple_acquire_attempts() -> None: + """Test multiple acquire attempts on the same lock instance.""" + with tempfile.TemporaryDirectory() as temp_dir: + lock_path = Path(temp_dir) / "test.lock" + lock = FileLock(str(lock_path)) + + # First acquire should succeed + assert lock.acquire() is True + + # Second acquire on same instance should fail + # (can't acquire same lock twice) + assert lock.acquire() is False + + lock.release() + + +def test_exception_in_context_manager() -> None: + """Test that lock is properly released even when exception occurs.""" + with tempfile.TemporaryDirectory() as temp_dir: + lock_path = Path(temp_dir) / "test.lock" + + # Test that exception is propagated and lock is released + with pytest.raises(ValueError, match="test exception"): + with FileLock(str(lock_path)) as lock: + assert lock._file_descriptor is not None + raise ValueError("test exception") + + # Lock should be released, so we can acquire it again + lock2 = FileLock(str(lock_path)) + assert lock2.acquire() is True + lock2.release() + + +concurrent_worker_script = ''' +import sys +import time +import random +from pathlib import Path +from tvm_ffi.utils.lockfile import FileLock + +def worker(worker_id, lock_path, counter_file): + """Worker function that tries to acquire lock and increment counter.""" + try: + with FileLock(lock_path): + # Critical section - read, increment, write counter + with open(counter_file, 'r') as f: + current_value = int(f.read().strip()) + + time.sleep(random.uniform(0.01, 0.1)) # Simulate some work + + with open(counter_file, 'w') as f: + f.write(str(current_value + 1)) + + print(f"Worker {worker_id}: success") + return 0 + except Exception as e: + print(f"Worker {worker_id}: error: {e}") + return 1 + +if __name__ == "__main__": + worker_id = int(sys.argv[1]) + lock_path = sys.argv[2] + counter_file = sys.argv[3] + sys.exit(worker(worker_id, lock_path, counter_file)) +''' + + +def test_concurrent_access() -> None: + """Test concurrent access from multiple processes.""" + with tempfile.TemporaryDirectory() as temp_dir: + lock_path = Path(temp_dir) / "test.lock" + counter_file = Path(temp_dir) / "counter.txt" + + # Initialize counter file + counter_file.write_text("0") + + # Create worker script content + + # Write worker script to a temporary file + worker_script_path = Path(temp_dir) / "worker.py" + worker_script_path.write_text(concurrent_worker_script) + + # Run multiple worker processes concurrently + num_workers = 16 + processes = [] + for i in range(num_workers): + p = 
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]
