Skip to content

Commit

Permalink
Merge branch 'concedo_experimental' into croco_nex_0
Browse files Browse the repository at this point in the history
  • Loading branch information
Nexesenex committed Nov 8, 2024
2 parents 90084dc + 47968e6 commit c8ab2a2
Show file tree
Hide file tree
Showing 7 changed files with 9 additions and 7 deletions.
1 change: 1 addition & 0 deletions ggml/src/ggml-cuda.cu
Original file line number Diff line number Diff line change
Expand Up @@ -149,6 +149,7 @@ static ggml_cuda_device_info ggml_cuda_init() {
//#else
// GGML_LOG_INFO("%s: GGML_CUDA_FORCE_CUBLAS: no\n", __func__);
//#endif // GGML_CUDA_FORCE_CUBLAS
GGML_LOG_INFO("Initializing CUDA, please wait, this might take a while for first run...\n", __func__, info.device_count);
GGML_LOG_INFO("%s: found %d " GGML_CUDA_NAME " devices:\n", __func__, info.device_count);
for (int id = 0; id < info.device_count; ++id) {
int device_vmm = 0;
Expand Down
2 changes: 1 addition & 1 deletion ggml/src/ggml-cuda/fattn-tile-f16.cu
Original file line number Diff line number Diff line change
Expand Up @@ -310,7 +310,7 @@ void ggml_cuda_flash_attn_ext_tile_f16(ggml_backend_cuda_context & ctx, ggml_ten
const ggml_tensor * Q = dst->src[0];

const int32_t precision = KQV->op_params[3];
GGML_ASSERT(precision == GGML_PREC_DEFAULT);
// GGML_ASSERT_CONTINUE(precision == GGML_PREC_DEFAULT);

float logit_softcap;
memcpy(&logit_softcap, (const float *) KQV->op_params + 2, sizeof(float));
Expand Down
2 changes: 1 addition & 1 deletion ggml/src/ggml-cuda/fattn-vec-f16.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -315,7 +315,7 @@ void ggml_cuda_flash_attn_ext_vec_f16_case(ggml_backend_cuda_context & ctx, ggml
const ggml_tensor * V = dst->src[2];

const int32_t precision = KQV->op_params[3];
GGML_ASSERT(precision == GGML_PREC_DEFAULT);
// GGML_ASSERT_CONTINUE(precision == GGML_PREC_DEFAULT);

GGML_ASSERT(K->type == type_K);
GGML_ASSERT(V->type == type_V);
Expand Down
2 changes: 1 addition & 1 deletion include/vulkan/spirv_cross/spirv_msl.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -682,7 +682,7 @@ class CompilerMSL : public CompilerGLSL

// Same as get_automatic_msl_resource_binding, but should only be used for combined image samplers, in which case the
// sampler's binding is returned instead. For any other resource type, -1 is returned.
// Secondary bindings are also used for the auxillary image atomic buffer.
// Secondary bindings are also used for the auxiliary image atomic buffer.
uint32_t get_automatic_msl_resource_binding_secondary(uint32_t id) const;

// Same as get_automatic_msl_resource_binding, but should only be used for combined image samplers for multiplanar images,
Expand Down
7 changes: 5 additions & 2 deletions klite.embd
Original file line number Diff line number Diff line change
Expand Up @@ -12645,14 +12645,14 @@ Current version indicated by LITEVER below.
//memory is allowed to be up to 0.8 times of ctx allowance, anote up to 0.6 times
let max_mem_len = Math.floor(max_allowed_characters*0.8);
let max_anote_len = Math.floor(max_allowed_characters*0.6);
let max_wi_len = Math.floor(max_allowed_characters*0.7);
let max_wi_len = Math.floor(max_allowed_characters*0.5);
let appendedsysprompt = "";
if(localsettings.opmode==4 && localsettings.instruct_sysprompt!="")
{
max_mem_len = Math.floor(max_allowed_characters*0.7);
appendedsysprompt = get_instruct_systag(false) + localsettings.instruct_sysprompt + "\n";
}
let truncated_memory = appendedsysprompt + substring_to_boundary(current_memory, max_mem_len);
let truncated_memory = substring_to_boundary(current_memory, max_mem_len);
if (truncated_memory != null && truncated_memory != "") {
if(newlineaftermemory)
{
Expand Down Expand Up @@ -12783,12 +12783,15 @@ Current version indicated by LITEVER below.
if(wi_insertlocation>0)
{
truncated_anote = wistr + truncated_anote;
truncated_anote = substring_to_boundary(truncated_anote, max_anote_len);
}
else
{
truncated_memory += wistr;
}

truncated_memory = appendedsysprompt + substring_to_boundary(truncated_memory, max_mem_len);

//now we resize the context such that the memory and authors note can fit inside
truncated_context = substring_to_boundary(truncated_context, max_allowed_characters);

Expand Down
1 change: 0 additions & 1 deletion otherarch/sdcpp/stable-diffusion.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -162,7 +162,6 @@ class StableDiffusionGGML {
#endif
#ifdef SD_USE_METAL
LOG_DEBUG("Using Metal backend");
ggml_backend_metal_log_set_callback(ggml_log_callback_default, nullptr);
backend = ggml_backend_metal_init();
#endif
#ifdef SD_USE_VULKAN
Expand Down
1 change: 0 additions & 1 deletion otherarch/sdcpp/upscaler.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,6 @@ struct UpscalerGGML {
#endif
#ifdef SD_USE_METAL
LOG_DEBUG("Using Metal backend");
ggml_backend_metal_log_set_callback(ggml_log_callback_default, nullptr);
backend = ggml_backend_metal_init();
#endif
#ifdef SD_USE_VULKAN
Expand Down

0 comments on commit c8ab2a2

Please sign in to comment.