Jean-Michaël Celerier jcelerier

## memcount_sse2.c
size_t memcount_sse2(const void *s, int c, size_t n) {
    __m128i cv = _mm_set1_epi8(c), sum = _mm_setzero_si128(), acr0,acr1,acr2,acr3;
    const char *p,*pe;
	for(p = s; p != (char *)s+(n- (n % (252*16)));) {
	  for(acr0 = acr1 = acr2 = acr3 = _mm_setzero_si128(),pe = p+252*16; p != pe; p += 64) {
		acr0 = _mm_add_epi8(acr0, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)p)));
		acr1 = _mm_add_epi8(acr1, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+16))));
		acr2 = _mm_add_epi8(acr2, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+32))));
		acr3 = _mm_add_epi8(acr3, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+48)))); __builtin_prefetch(p+1024);
	  }

## gist:516dba19737a498ce72d
#include <tuple>
#include <initializer_list>
#include <math.h>
#include <utility>

using namespace std;


template <typename Tup1, typename Tup2, size_t...s>
double euclidean_distance_impl (Tup1 const &tup1, Tup2 const &tup2, index_sequence<s...>)

## really_strong_typedef.cc
#include <type_traits>
#include <iostream>

#define REALLY_STRONG_TYPEDEF(From, To)                 \
  class To final {                                      \
    static_assert(std::is_scalar<From>(), "");          \
    From x;                                             \
                                                        \
   public:                                              \
    To() = default;                                     \

## gist:ca0ceb224ea789415387

# Install qemu, docker, etc.
yaourt -S qemu qemu-user-static binfmt-support

# The qemu-user-static AUR package is outdated and broken: the .deb package it pulls is no longer in the Ubuntu repository.
# Edit the PKGBUILD and use qemu-user-static_2.4+dfsg-3_amd64.deb (with SHA1 sum "84d83a16c60c82b6c579f2f750b04a3ac26c249b").

# Enable ARM emulation
update-binfmts --enable qemu-arm

## vector_view.cpp
// vector_view class, based on code by James exjam https://github.com/exjam/string_view
// rlyeh, public domain

#pragma once
#include <vector>

#if defined(_MSC_VER) && _MSC_VER < 1900
#define constexpr
#define noexcept
#endif

## gist:a7adca91bba7089ba47b

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              1 star
            
          
                philipz
                / gist:a7adca91bba7089ba47b
            
            
              Created
              February 17, 2015 08:50
            
              
                Run RPi Raspbian on Docker 
              
          
    docker run -it --rm -v /usr/bin/qemu-arm-static:/usr/bin/qemu-arm-static philipz/rpi-raspbian bash

  
## CMakeLists.txt
cmake_minimum_required(VERSION 2.8.11)

project(VtkFboInQtQuick)

set(CMAKE_INCLUDE_CURRENT_DIR ON)
set(CMAKE_AUTOMOC ON)

find_package(VTK REQUIRED)
include(${VTK_USE_FILE})

## howtogif
How to convert a video file to an animated GIF on Linux:

Install required software:
apt-get install ffmpeg gifsicle imagemagick
Convert the video file to a series of small images:
mkdir /tmp/gif/
ffmpeg -i YOURVIDEOFILE.mp4 -r 10 /tmp/gif/out%04d.gif
Combine these images together into a GIF animation:
gifsicle --delay=10 --loop /tmp/gif/*.gif > animation.gif
Optimise the GIF animation so the file size is smaller:

## magic_ring.cpp
#define _CRT_SECURE_NO_DEPRECATE

#include <stdio.h>
#include <string.h>
#include <Windows.h>

// This allocates a "magic ring buffer" that is mapped twice, with the two
// copies being contiguous in (virtual) memory. The advantage of this is
// that this allows any function that expects data to be contiguous in
// memory to read from (or write to) such a buffer. It also means that

## latency.markdown

      
              2 files
            
          
              742 forks
            
          
              50 comments
            
          
              4390 stars
            
          
                hellerbarde
                / latency.markdown
            
            
              Created
              May 31, 2012 13:16
                — forked from jboner/latency.txt
            
              
                Latency numbers every programmer should know
              
          
    Latency numbers every programmer should know

L1 cache reference ......................... 0.5 ns
Branch mispredict ............................ 5 ns
L2 cache reference ........................... 7 ns
Mutex lock/unlock ........................... 25 ns
Main memory reference ...................... 100 ns             
Compress 1K bytes with Zippy ............. 3,000 ns  =   3 µs
Send 2K bytes over 1 Gbps network ....... 20,000 ns  =  20 µs
SSD random read ........................ 150,000 ns  = 150 µs

Read 1 MB sequentially from memory ..... 250,000 ns = 250 µs
	size_t memcount_sse2(const void *s, int c, size_t n) {
	__m128i cv = _mm_set1_epi8(c), sum = _mm_setzero_si128(), acr0,acr1,acr2,acr3;
	const char *p,*pe;
	for(p = s; p != (char *)s+(n- (n % (252*16)));) {
	for(acr0 = acr1 = acr2 = acr3 = _mm_setzero_si128(),pe = p+252*16; p != pe; p += 64) {
	acr0 = _mm_add_epi8(acr0, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)p)));
	acr1 = _mm_add_epi8(acr1, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+16))));
	acr2 = _mm_add_epi8(acr2, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+32))));
	acr3 = _mm_add_epi8(acr3, _mm_cmpeq_epi8(cv, _mm_loadu_si128((const __m128i *)(p+48)))); __builtin_prefetch(p+1024);
	}
	#include <tuple>
	#include <initializer_list>
	#include <math.h>
	#include <utility>

	using namespace std;


	template <typename Tup1, typename Tup2, size_t...s>
	double euclidean_distance_impl (Tup1 const &tup1, Tup2 const &tup2, index_sequence<s...>)
	#include <type_traits>
	#include <iostream>

	#define REALLY_STRONG_TYPEDEF(From, To) \
	class To final { \
	static_assert(std::is_scalar<From>(), ""); \
	From x; \
	\
	public: \
	To() = default; \

	# Install qemu, docker, etc.
	yaourt -S qemu qemu-user-static binfmt-support

	# The qemu-user-static AUR package is outdated and broken: the .deb package it pulls is no longer in the Ubuntu repository.
	# Edit the PKGBUILD and use qemu-user-static_2.4+dfsg-3_amd64.deb (with SHA1 sum "84d83a16c60c82b6c579f2f750b04a3ac26c249b").

	# Enable ARM emulation
	update-binfmts --enable qemu-arm
	// vector_view class, based on code by James exjam https://github.com/exjam/string_view
	// rlyeh, public domain

	#pragma once
	#include <vector>

	#if defined(_MSC_VER) && _MSC_VER < 1900
	#define constexpr
	#define noexcept
	#endif
	cmake_minimum_required(VERSION 2.8.11)

	project(VtkFboInQtQuick)

	set(CMAKE_INCLUDE_CURRENT_DIR ON)
	set(CMAKE_AUTOMOC ON)

	find_package(VTK REQUIRED)
	include(${VTK_USE_FILE})
	How to convert a video file to an animated GIF on Linux:

	Install required software:
	apt-get install ffmpeg gifsicle imagemagick
	Convert the video file to a series of small images:
	mkdir /tmp/gif/
	ffmpeg -i YOURVIDEOFILE.mp4 -r 10 /tmp/gif/out%04d.gif
	Combine these images together into a GIF animation:
	gifsicle --delay=10 --loop /tmp/gif/*.gif > animation.gif
	Optimise the GIF animation so the file size is smaller:
	#define _CRT_SECURE_NO_DEPRECATE

	#include <stdio.h>
	#include <string.h>
	#include <Windows.h>

	// This allocates a "magic ring buffer" that is mapped twice, with the two
	// copies being contiguous in (virtual) memory. The advantage of this is
	// that this allows any function that expects data to be contiguous in
	// memory to read from (or write to) such a buffer. It also means that