Meng Wei weimeng23

## CMakeLists.txt
# Require CMake 3.14 or newer. The legacy FATAL_ERROR keyword is omitted:
# CMake 2.6 and later accept it but ignore it, so it has no effect here.
cmake_minimum_required(VERSION 3.14)

# Declare the project name, its version, and the only language it uses (C++).
project(LearnCmake VERSION 1.0 LANGUAGES CXX)

# Build the static library `add` from add.cc.
add_library(add STATIC add.cc)

# Build the executable `main` from main.cc.
# NOTE(review): in the lines visible here `main` is never linked against `add`;
# if main.cc calls into it, target_link_libraries(main PRIVATE add) is needed -
# confirm against the rest of the file.
add_executable(main main.cc)

## install_glibc.sh
# Download, build and install glibc 2.35 under a custom prefix.
# Stop at the first failing command so later steps never run in the wrong directory.
set -e

# Fetch the tarball of the glibc-2.35 tag and unpack it.
wget https://github.com/bminor/glibc/archive/refs/tags/glibc-2.35.tar.gz
tar xvf glibc-2.35.tar.gz
cd glibc-glibc-2.35

# Configure and build inside a separate build directory; -p lets a re-run reuse an existing one.
mkdir -p build
cd build
# Replace /path/to/install with the real installation prefix before running.
../configure --prefix=/path/to/install
make -j10
make install

## logger.py
import logging

# Module-level logger named after this module; it lets every record of
# level DEBUG and above through to its handlers.
logger = logging.getLogger(__name__)
logger.setLevel(level=logging.DEBUG)

# Record layout: timestamp | level | source file | thread | function | line | message.
# (An earlier formatter assignment was overwritten immediately and has been removed.)
formatter = logging.Formatter('%(asctime)s | %(levelname)s | %(filename)s | %(threadName)s | %(funcName)s | %(lineno)s | %(message)s')

# File handler: writes records of level INFO and above to log.txt using the layout above.
fh = logging.FileHandler("log.txt")
fh.setLevel(logging.INFO)
fh.setFormatter(formatter)
logger.addHandler(fh)

## export_bert_onnx.py
class MyBertForSequenceClassification(BertForSequenceClassification):
    """Variant of ``BertForSequenceClassification`` whose forward pass yields only logits.

    The result of the parent's ``forward`` is reduced to its ``logits`` attribute,
    so callers receive that single value instead of the full output object.
    NOTE(review): judging by the file name this wrapper exists for ONNX export - confirm.
    """

    def forward(self, input_ids=None, attention_mask=None, token_type_ids=None):
        """Run the parent forward pass and return its ``logits``.

        All three arguments are handed to the parent class unchanged, by keyword.
        """
        return super().forward(
            input_ids=input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
        ).logits


## M365Princess.omp.json
{
  "$schema": "https://raw.githubusercontent.com/JanDeDobbeleer/oh-my-posh/main/themes/schema.json",
  "palette": {
    "white": "#FFFFFF",
    "tan": "#CC3802",
    "teal": "#047E84",
    "plum": "#9A348E",
    "blush": "#DA627D",
    "salmon": "#FCA17D",
    "sky": "#86BBD8",

## 24-bit-truecolor.sh
#!/bin/bash
#
#   This file echoes four gradients with 24-bit color codes
#   to the terminal to demonstrate their functionality.
#   The foreground escape sequence is ^[38;2;<r>;<g>;<b>m
#   The background escape sequence is ^[48;2;<r>;<g>;<b>m
#   <r> <g> <b> range from 0 to 255 inclusive.
#   The escape sequence ^[0m returns output to default

# Delimiter character, defined once here. NOTE(review): the code that uses it lies
# outside this excerpt - presumably it separates the fields of the colour escape
# sequences described above; confirm against the full script.
SEPARATOR=':'

## kaldi_io_mechanisms.py
# Shell pipeline text (ending in "|") that runs compute-mfcc-feats on wav_test.scp
# and pipes its output through add-deltas.
delta_command = "compute-mfcc-feats --config=conf/mfcc.conf scp,p:wav_test.scp ark:- | add-deltas ark:- ark:- |"
# Read specifier for the delta features: the pipeline above prefixed with "ark:".
delta_feats_rspecifier = "ark:" + delta_command

# Same pipeline without the add-deltas stage.
mfcc_command = "compute-mfcc-feats --config=conf/mfcc.conf scp,p:wav_test.scp ark:- |"
# Read specifier for the plain MFCC features: the pipeline above prefixed with "ark:".
mfcc_feats_rspecifier = "ark:" + mfcc_command

## read_wav_pcm.py
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# File              : read_wav_pcm.py
# Author            : Meng Wei <wmeng94@gmail.com>
# Date              : 23.03.2023
# Last Modified Date: 23.03.2023
# Last Modified By  : Meng Wei <wmeng94@gmail.com>

import librosa
import numpy as np

## mngw-w64_boost.MD

      
              1 file
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                weimeng23
                / mngw-w64_boost.MD
            
            
              Created
              February 26, 2022 06:33
                — forked from zrsmithson/mngw-w64_boost.MD
            
              
                Installing boost on Windows using MinGW-w64 (gcc 64-bit)
              
          
    Installing boost on Windows using MinGW-w64 (gcc 64-bit)

Introduction

Boost is easy to use when you only need the headers or the pre-compiled binaries for Visual Studio, but it can be a pain to compile from source on Windows, especially when you want the 64-bit version of MinGW so that you can use gcc/g++. This installation process should be thorough enough that you can simply copy and paste the commands, yet robust enough to install everything you need.
Note: if you need to install any of the libraries that have external dependencies, see this great answer on Stack Overflow.
Get files needed for install

Get the MinGW installer mingw-w64-install.exe from Sourceforge

Get the boost_1_68_0.zip source from Sourceforge

__Note: This should work perfectly w

  
## DeepLearningPapers.md

      
              23 files
            
          
              0 forks
            
          
              0 comments
            
          
              0 stars
            
          
                weimeng23
                / DeepLearningPapers.md
            
            
              Created
              August 23, 2021 09:06
                — forked from wael34218/DeepLearningPapers.md
            
          
    05/05/2018

2018: Speech2Vec: A Sequence-to-Sequence Framework for Learning Word Embeddings from Speech

Projects audio segments that each contain one spoken word into a high-dimensional space, just like Word2Vec. Uses "Forced Alignment" to split the audio into words (which requires the text). The audio segments are padded with zeros, converted to MFCCs, and fed into an encoder-decoder that uses RMSE. They also add noise to the signal and make the network denoise it. Uses 500 hours of LibriSpeech audio.
Not sure how it can be incorporated into ASR or TTS systems. The audio file has to be paired with its text; otherwise Speech2Vec cannot split the audio file into words using the "Forced Alignment" method.
It can be used to query whether a spoken word is similar to an existing word in the corpus.
2016: Neural Machine Translation of Rare Words with Subword Units (BPE)

BPE is a data compression technique that replaces the most frequent pair of bytes with a single one. It works well with named entities, loanwords and morphologically complex words. Handles OOVs and rare words well. You can
	# Require CMake 3.14 or newer. The legacy FATAL_ERROR keyword is omitted:
	# CMake 2.6 and later accept it but ignore it, so it has no effect here.
	cmake_minimum_required(VERSION 3.14)

	# Declare the project name, its version, and the only language it uses (C++).
	project(LearnCmake VERSION 1.0 LANGUAGES CXX)

	# Build the static library `add` from add.cc.
	add_library(add STATIC add.cc)

	# Build the executable `main` from main.cc.
	# NOTE(review): in the lines visible here `main` is never linked against `add`;
	# if main.cc calls into it, target_link_libraries(main PRIVATE add) is needed -
	# confirm against the rest of the file.
	add_executable(main main.cc)
	# Download, build and install glibc 2.35 under a custom prefix.
	# Stop at the first failing command so later steps never run in the wrong directory.
	set -e

	# Fetch the tarball of the glibc-2.35 tag and unpack it.
	wget https://github.com/bminor/glibc/archive/refs/tags/glibc-2.35.tar.gz
	tar xvf glibc-2.35.tar.gz
	cd glibc-glibc-2.35

	# Configure and build inside a separate build directory; -p lets a re-run reuse an existing one.
	mkdir -p build
	cd build
	# Replace /path/to/install with the real installation prefix before running.
	../configure --prefix=/path/to/install
	make -j10
	make install
	import logging

	# Module-level logger named after this module; it lets every record of
	# level DEBUG and above through to its handlers.
	logger = logging.getLogger(__name__)
	logger.setLevel(level=logging.DEBUG)

	# Record layout: timestamp | level | source file | thread | function | line | message.
	# The separators are plain "|" characters; the backslash-escaped pipes that were here
	# would have been written literally into every log line. An earlier formatter
	# assignment that was overwritten immediately has been removed.
	formatter = logging.Formatter('%(asctime)s | %(levelname)s | %(filename)s | %(threadName)s | %(funcName)s | %(lineno)s | %(message)s')

	# File handler: writes records of level INFO and above to log.txt using the layout above.
	fh = logging.FileHandler("log.txt")
	fh.setLevel(logging.INFO)
	fh.setFormatter(formatter)
	logger.addHandler(fh)
	class MyBertForSequenceClassification(BertForSequenceClassification):
	    """Variant of ``BertForSequenceClassification`` whose forward pass yields only logits.

	    NOTE(review): presumably used for model export - confirm against the caller.
	    """

	    def forward(self, input_ids=None, attention_mask=None, token_type_ids=None):
	        """Run the parent forward pass with the given arguments and return its ``logits``."""
	        outputs = super().forward(
	            input_ids=input_ids,
	            attention_mask=attention_mask,
	            token_type_ids=token_type_ids,
	        )
	        # Discard everything except the logits attribute of the parent's result.
	        return outputs.logits
	{
	"$schema": "https://raw.githubusercontent.com/JanDeDobbeleer/oh-my-posh/main/themes/schema.json",
	"palette": {
	"white": "#FFFFFF",
	"tan": "#CC3802",
	"teal": "#047E84",
	"plum": "#9A348E",
	"blush": "#DA627D",
	"salmon": "#FCA17D",
	"sky": "#86BBD8",
	#!/bin/bash
	#
	# This file echoes four gradients with 24-bit color codes
	# to the terminal to demonstrate their functionality.
	# The foreground escape sequence is ^[38;2;<r>;<g>;<b>m
	# The background escape sequence is ^[48;2;<r>;<g>;<b>m
	# <r> <g> <b> range from 0 to 255 inclusive.
	# The escape sequence ^[0m returns output to default

	# Delimiter character, defined once here. NOTE(review): the code that uses it lies
	# outside this excerpt - presumably it separates the fields of the colour escape
	# sequences described above; confirm against the full script.
	SEPARATOR=':'
	# Shell pipeline text (ending in "|") that runs compute-mfcc-feats on wav_test.scp
	# and pipes its output through add-deltas. The pipes are plain "|" characters:
	# the backslash-escaped form that was here put literal backslashes into the command.
	delta_command = "compute-mfcc-feats --config=conf/mfcc.conf scp,p:wav_test.scp ark:- | add-deltas ark:- ark:- |"
	# Read specifier for the delta features: the pipeline above prefixed with "ark:".
	delta_feats_rspecifier = (
	    f'ark:{delta_command}'
	)

	# Same pipeline without the add-deltas stage.
	mfcc_command = "compute-mfcc-feats --config=conf/mfcc.conf scp,p:wav_test.scp ark:- |"
	# Read specifier for the plain MFCC features: the pipeline above prefixed with "ark:".
	mfcc_feats_rspecifier = (
	    f'ark:{mfcc_command}'
	)
	#!/usr/bin/env python3
	# -*- coding: utf-8 -*-
	# File : read_wav_pcm.py
	# Author : Meng Wei <wmeng94@gmail.com>
	# Date : 23.03.2023
	# Last Modified Date: 23.03.2023
	# Last Modified By : Meng Wei <wmeng94@gmail.com>

	import librosa
	import numpy as np