svjack
/

sd-ggml-cpp-dp

Model card Files Files and versions

sd-ggml-cpp-dp / stable-diffusion.cpp /ggml /examples /mnist /main-cpu.cpp

svjack's picture

Upload folder using huggingface_hub

13d3ba0 over 1 year ago

3.54 kB

	// Use a pre-generated MNIST compute graph for inference on the CPU
	//
	// You can generate a compute graph using the "mnist" tool:
	//
	// $ ./bin/mnist ./models/mnist/ggml-model-f32.bin ../examples/mnist/models/mnist/t10k-images.idx3-ubyte
	//
	// This command creates the "mnist.ggml" file, which contains the generated compute graph.
	// Now, you can re-use the compute graph with the "mnist-cpu" tool:
	//
	// $ ./bin/mnist-cpu ./models/mnist/mnist.ggml ../examples/mnist/models/mnist/t10k-images.idx3-ubyte
	//

	#include "ggml/ggml.h"

	#include <algorithm>
	#include <cmath>
	#include <cstdio>
	#include <cstring>
	#include <ctime>
	#include <fstream>
	#include <vector>

	#if defined(_MSC_VER)
	#pragma warning(disable: 4244 4267) // possible loss of data
	#endif

	// Evaluate a pre-exported MNIST compute graph on a single digit.
	//
	// - fname_cgraph: path to the compute graph file (loaded via ggml_graph_import)
	// - n_threads:    number of threads passed to ggml_graph_compute_with_ctx
	// - digit:        784 pixel values; must provide at least as many bytes as
	//                 the graph's "input" tensor occupies
	//
	// returns 0 - 9 prediction (index of the largest of the first 10 "probs" values)
	//
	// Aborts via GGML_ASSERT if a required tensor is missing from the graph or
	// if `digit` is too small for the "input" tensor.
	int mnist_eval(
	        const char * fname_cgraph,
	        const int n_threads,
	        std::vector<float> digit) {
	    // load the compute graph
	    struct ggml_context * ctx_data = NULL;
	    struct ggml_context * ctx_eval = NULL;

	    struct ggml_cgraph gfi = ggml_graph_import(fname_cgraph, &ctx_data, &ctx_eval);

	    // param export/import test
	    struct ggml_tensor * fc1_bias = ggml_graph_get_tensor(&gfi, "fc1_bias");
	    GGML_ASSERT(fc1_bias != NULL);
	    GGML_ASSERT(fc1_bias->op_params[0] == int(0xdeadbeef));

	    // allocate work context
	    // needed during ggml_graph_compute() to allocate a work tensor
	    // the buffer is static so it is allocated once and reused across calls
	    static size_t buf_size = 128ull*1024*1024; // TODO
	    static void * buf = malloc(buf_size);

	    struct ggml_init_params params = {
	        /*.mem_size   =*/ buf_size,
	        /*.mem_buffer =*/ buf,
	        /*.no_alloc   =*/ false,
	    };

	    struct ggml_context * ctx_work = ggml_init(params);
	    GGML_ASSERT(ctx_work != NULL);

	    // copy the pixel values into the graph's input tensor
	    struct ggml_tensor * input = ggml_graph_get_tensor(&gfi, "input");
	    GGML_ASSERT(input != NULL);

	    // never read past the end of the caller-supplied pixel vector
	    const size_t n_input_bytes = ggml_nbytes(input);
	    GGML_ASSERT(digit.size() * sizeof(float) >= n_input_bytes);
	    memcpy(input->data, digit.data(), n_input_bytes);

	    ggml_graph_compute_with_ctx(ctx_work, &gfi, n_threads);

	    struct ggml_tensor * probs = ggml_graph_get_tensor(&gfi, "probs");
	    GGML_ASSERT(probs != NULL);

	    const float * probs_data = ggml_get_data_f32(probs);

	    // the prediction is the index of the highest of the 10 class scores
	    const int prediction = (int) (std::max_element(probs_data, probs_data + 10) - probs_data);

	    ggml_free(ctx_work);
	    ggml_free(ctx_data);
	    ggml_free(ctx_eval);

	    return prediction;
	}

	// Entry point: picks a random digit from an MNIST image file, renders it as
	// ASCII art on stderr, runs it through the compute graph and prints the
	// predicted digit on stdout.
	//
	// - argv[1]: path to the exported compute graph (mnist.ggml)
	// - argv[2]: path to the MNIST image file (t10k-images.idx3-ubyte)
	//
	// returns 0 on success, 1 on a usage error or when the digit cannot be read
	int main(int argc, char ** argv) {
	    srand(time(NULL));
	    ggml_time_init();

	    if (argc != 3) {
	        fprintf(stderr, "Usage: %s models/mnist/mnist.ggml models/mnist/t10k-images.idx3-ubyte\n", argv[0]);
	        // a usage error is a failure, so report a non-zero status
	        return 1;
	    }

	    // zero-initialized so no indeterminate bytes are ever rendered or evaluated
	    uint8_t buf[784] = {0};
	    std::vector<float> digit;

	    // read a random digit from the test set
	    {
	        std::ifstream fin(argv[2], std::ios::binary);
	        if (!fin) {
	            fprintf(stderr, "%s: failed to open '%s'\n", __func__, argv[2]);
	            return 1;
	        }

	        // seek to a random digit: 16-byte header + 28*28 * (random 0 - 9999)
	        fin.seekg(16 + 784 * (rand() % 10000));
	        fin.read(reinterpret_cast<char *>(buf), sizeof(buf));

	        // a short or failed read means the file does not contain the full digit
	        if (!fin) {
	            fprintf(stderr, "%s: failed to read digit from '%s'\n", __func__, argv[2]);
	            return 1;
	        }
	    }

	    // render the digit in ASCII
	    {
	        digit.resize(sizeof(buf));

	        for (int row = 0; row < 28; row++) {
	            for (int col = 0; col < 28; col++) {
	                const int idx = row*28 + col;

	                // bright pixels (> 230) are drawn as '*', everything else as '_'
	                fprintf(stderr, "%c ", (float)buf[idx] > 230 ? '*' : '_');
	                digit[idx] = ((float)buf[idx]);
	            }

	            fprintf(stderr, "\n");
	        }

	        fprintf(stderr, "\n");
	    }

	    // inference runs single-threaded
	    const int prediction = mnist_eval(argv[1], 1, digit);

	    fprintf(stdout, "%s: predicted digit is %d\n", __func__, prediction);

	    return 0;
	}