http://elegantcode.com/2011/06/18/git-on-windows-creating-a-network-shared-central-repository/
pushd \\remoteServer\git\Share\Folder\Path
sudo apt autoremove openvswitch-common openvswitch-switch-dpdk openvswitch-dbg openvswitch-pki openvswitch-ipsec openvswitch-switch openvswitch-switch-dpdk openvswitch-ipsec openvswitch-test openvswitch-testcontroller openvswitch-vtep
wget http://openvswitch.org/releases/openvswitch-2.4.0.tar.gz
# This isn't supposed to run as a bash script; I named it with ".sh" only for syntax highlighting.
# https://developer.nvidia.com/nsight-systems
# https://docs.nvidia.com/nsight-systems/profiling/index.html
# My preferred nsys (the command-line executable used to create profiles) commands
#
# In your script, write
# torch.cuda.nvtx.range_push("region name")
# ...
set-option -sa terminal-overrides ",xterm*:Tc" | |
set -g mouse on | |
unbind C-b | |
set -g prefix C-t | |
bind C-t send-prefix | |
# List of plugins
# This requires tpm to be installed first
-- Install packer | |
local install_path = vim.fn.stdpath 'data' .. '/site/pack/packer/start/packer.nvim' | |
local is_bootstrap = false | |
if vim.fn.empty(vim.fn.glob(install_path)) > 0 then | |
is_bootstrap = true | |
vim.fn.system { 'git', 'clone', '--depth', '1', 'https://github.com/wbthomason/packer.nvim', install_path } | |
vim.cmd [[packadd packer.nvim]] | |
end | |
require('packer').startup(function(use) |
""" | |
call to _all_gather_base with c10d._coalescing_manager | |
Test command: | |
mpirun -np $1 -N ${ndev_per_node} --hostfile ${HOST_FILE} \ | |
--mca plm_rsh_no_tree_spawn 1 \ | |
-mca btl tcp,self --mca btl_tcp_if_exclude lo,docker0 \ | |
--mca pml ^cm \ | |
-bind-to none \ | |
--tag-output \ | |
-x LD_LIBRARY_PATH=$LD_LIBRARY_PATH \ |
// CUDA runtime | |
#include <cuda_runtime.h> | |
#include <cuda.h> | |
#include <cassert> | |
#include <iostream> | |
#include <memory> | |
#include <thread> | |
#include <atomic> |
diff --git a/csrc/lamb/fused_lamb_cuda_kernel.cu b/csrc/lamb/fused_lamb_cuda_kernel.cu | |
index e934b69c..207faa39 100644 | |
--- a/csrc/lamb/fused_lamb_cuda_kernel.cu | |
+++ b/csrc/lamb/fused_lamb_cuda_kernel.cu | |
@@ -8,7 +8,7 @@ | |
#include "ATen/cuda/CUDAContext.h" | |
#include "ATen/cuda/detail/IndexUtils.cuh" | |
//#include "ATen/Type.h" | |
-#include <THC/THCGeneral.h> | |
+// #include <THC/THCGeneral.h> |
diff --git a/csrc/lamb/fused_lamb_cuda_kernel.cu b/csrc/lamb/fused_lamb_cuda_kernel.cu | |
index 0448a45..ff87993 100644 | |
--- a/csrc/lamb/fused_lamb_cuda_kernel.cu | |
+++ b/csrc/lamb/fused_lamb_cuda_kernel.cu | |
@@ -464,7 +464,7 @@ void fused_lamb_cuda(at::Tensor& p, | |
lamb_coeff.data<scalar_t>()); | |
})); | |
} | |
- THCudaCheck(cudaGetLastError()); | |
+ AT_CUDA_CHECK(cudaGetLastError()); |