Skip to content

Commit

Permalink
Diffusion model case
Browse files Browse the repository at this point in the history
  • Loading branch information
EricLBuehler committed Sep 18, 2024
1 parent 8dd0000 commit 9153aff
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion mistralrs-core/src/engine/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -77,7 +77,10 @@ impl Engine {
let device = get_mut_arcmutex!(pipeline).device().clone();
let is_xlora = get_mut_arcmutex!(pipeline).get_metadata().is_xlora;
let has_no_kv_cache = get_mut_arcmutex!(pipeline).get_metadata().has_no_kv_cache;
- assert_eq!(has_no_kv_cache, no_kv_cache);
+ if no_kv_cache {
+ // Diffusion models...
+ assert_eq!(has_no_kv_cache, no_kv_cache);
+ }
// Prefix caching is always disabled if using PagedAttention for now.
// TODO
let no_prefix_cache = matches!(config, SchedulerConfig::PagedAttentionMeta { .. })
Expand Down

0 comments on commit 9153aff

Please sign in to comment.