Skip to content

Commit bf081fb

Browse files
authored
modify patch and workflow (#163)
1 parent f939165 commit bf081fb

File tree

3 files changed

+14
-14
lines changed

3 files changed

+14
-14
lines changed

.github/workflows/unifiedcache_test.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,7 @@ jobs:
5151
- name: Print debug info
5252
run: |
5353
echo "GITHUB_WORKSPACE is $GITHUB_WORKSPACE"
54-
ls -l $GITHUB_WORKSPACE/unifiedcache/patch
54+
ls -l $GITHUB_WORKSPACE/ucm/patch
5555
5656
- name: Debug repo layout
5757
run: |
@@ -60,7 +60,7 @@ jobs:
6060
ls -l "$GITHUB_WORKSPACE"
6161
- name: Apply patch
6262
run: |
63-
git -C /vllm-workspace/vllm apply $GITHUB_WORKSPACE/unifiedcache/patch/0.9.2/vllm-adapt.patch
63+
git -C /vllm-workspace/vllm apply $GITHUB_WORKSPACE/ucm/patch/0.9.2/vllm-adapt.patch
6464
6565

6666
- name: Install unified-cache-management

ucm/patch/0.9.2/vllm-adapt-sparse.patch

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@ index f0ad68b16..847c97371 100644
2121
from vllm.platforms import _Backend, current_platform
2222
from vllm.utils import direct_register_custom_op
2323
from vllm.v1.attention.backends.utils import validate_kv_sharing_target
24-
+from unifiedcache.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
24+
+from ucm.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
2525

2626

2727
class Attention(nn.Module):
@@ -114,8 +114,8 @@ index 6937455e7..3a44db442 100644
114114
from vllm.v1.kv_cache_interface import KVCacheConfig
115115
from vllm.v1.metrics.stats import PrefixCacheStats
116116
from vllm.v1.request import Request, RequestStatus
117-
+from unifiedcache.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
118-
+from unifiedcache.integration.vllm.ucm_sparse.base import INVALID_SLOT
117+
+from ucm.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
118+
+from ucm.integration.vllm.ucm_sparse.base import INVALID_SLOT
119119

120120
logger = init_logger(__name__)
121121

@@ -179,8 +179,8 @@ index 22c0ad8d6..c5c39a2b8 100644
179179
from vllm.v1.spec_decode.metrics import SpecDecodingStats
180180
from vllm.v1.structured_output import StructuredOutputManager
181181

182-
+from unifiedcache.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized, get_ucm_sparse, has_ucm_sparse
183-
+from unifiedcache.integration.vllm.ucm_sparse.base import UcmSparseBase, UcmSparseRole, INVALID_SLOT
182+
+from ucm.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized, get_ucm_sparse, has_ucm_sparse
183+
+from ucm.integration.vllm.ucm_sparse.base import UcmSparseBase, UcmSparseRole, INVALID_SLOT
184184
+
185185
logger = init_logger(__name__)
186186

@@ -313,8 +313,8 @@ index 14278bb6a..84a597b0e 100644
313313
from .utils import (gather_mm_placeholders, initialize_kv_cache_for_kv_sharing,
314314
sanity_check_mm_encoder_outputs, scatter_mm_placeholders)
315315

316-
+from unifiedcache.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
317-
+from unifiedcache.integration.vllm.ucm_sparse.base import UcmSparseMetadata, INVALID_SLOT
316+
+from ucm.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
317+
+from ucm.integration.vllm.ucm_sparse.base import UcmSparseMetadata, INVALID_SLOT
318318
+
319319
if TYPE_CHECKING:
320320
import xgrammar as xgr
@@ -482,7 +482,7 @@ index 7117f60b5..c239e1f02 100644
482482
from vllm.v1.utils import report_usage_stats
483483
from vllm.v1.worker.gpu_model_runner import GPUModelRunner
484484
from vllm.v1.worker.worker_base import WorkerBase
485-
+from unifiedcache.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized
485+
+from ucm.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized
486486

487487
logger = init_logger(__name__)
488488

ucm/patch/0.9.2/vllm-ascend-adapt-sparse.patch

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ index 915feb7..0600f35 100644
1717
from vllm_ascend.utils import (ACL_FORMAT_FRACTAL_NZ, aligned_16, is_310p,
1818
nd_to_nz_2d, nd_to_nz_spec)
1919

20-
+from unifiedcache.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
20+
+from ucm.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
2121
+
2222

2323
class AscendAttentionBackend(AttentionBackend):
@@ -91,8 +91,8 @@ index f9cca93..31766b2 100644
9191
from vllm_ascend.worker.mtp_proposer_v1 import MtpProposer
9292
from vllm_ascend.worker.npu_input_batch import CachedRequestState, InputBatch
9393

94-
+from unifiedcache.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
95-
+from unifiedcache.integration.vllm.ucm_sparse.base import UcmSparseMetadata, INVALID_SLOT
94+
+from ucm.integration.vllm.ucm_sparse.state import get_ucm_sparse, has_ucm_sparse
95+
+from ucm.integration.vllm.ucm_sparse.base import UcmSparseMetadata, INVALID_SLOT
9696
+
9797
if TYPE_CHECKING:
9898
import xgrammar as xgr # type: ignore[import-untyped]
@@ -250,7 +250,7 @@ index df03d50..6ea5bf3 100644
250250
read_kv_cache_bytes_from_file,
251251
sleep_mode_enabled, try_register_lib)
252252
from vllm_ascend.worker.model_runner_v1 import NPUModelRunner
253-
+from unifiedcache.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized
253+
+from ucm.integration.vllm.ucm_sparse.state import ensure_ucm_sparse_initialized
254254

255255

256256
class NPUWorker(WorkerBase):

0 commit comments

Comments
 (0)