RMSE (Root Mean Squared Error) can be defined as the square root of the mean of the squared errors: square root of { (1/n) * summation over all i of [Yi - (W^T.Xi)]^2 }. We square the difference between the predicted value and the real value before summing so that positive and negative errors don't cancel each other out, which would otherwise leave us with an error much smaller than the actual error. We then find W by differentiating this loss function w.r.t. W and equating the gradient to zero.
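Setting the gradient of the squared-error loss to zero yields the normal equations, (X^T.X)W = X^T.Y, which can be solved for W directly. A minimal sketch in numpy, using synthetic data (the sample sizes and noise level here are illustrative assumptions):

```python
import numpy as np

# Synthetic data: 100 samples, 3 features, generated from a known weight
# vector plus a little noise (values chosen purely for illustration).
rng = np.random.default_rng(0)
X = rng.normal(size=(100, 3))
true_w = np.array([2.0, -1.0, 0.5])
y = X @ true_w + rng.normal(scale=0.1, size=100)

# Differentiating the squared-error loss w.r.t. W and equating to zero
# gives the normal equations: (X^T X) W = X^T y.
w = np.linalg.solve(X.T @ X, X.T @ y)

# RMSE of the fitted model: sqrt of the mean squared residual.
rmse = np.sqrt(np.mean((y - X @ w) ** 2))
```

Because the loss is quadratic in W, this closed-form solution is the global minimum; no iterative optimization is needed.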
However, it is interesting to note that we don't necessarily have to square the difference to get rid of the negative values. The same could be achieved by taking the absolute value of the difference between the predicted and real values. This is known as Mean Absolute Error, or MAE: (1/n) * summation over all i of abs[Yi - (W^T.Xi)].
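To make the two metrics concrete, here is a small comparison on a handful of hand-picked predictions (the values are illustrative assumptions, not from the text):

```python
import numpy as np

# Hypothetical true values and model predictions.
y_true = np.array([3.0, -0.5, 2.0, 7.0])
y_pred = np.array([2.5, 0.0, 2.0, 8.0])

# MAE: mean of absolute differences.
mae = np.mean(np.abs(y_true - y_pred))    # (0.5 + 0.5 + 0.0 + 1.0) / 4 = 0.5

# RMSE: square root of the mean of squared differences.
rmse = np.sqrt(np.mean((y_true - y_pred) ** 2))
```

Note that RMSE comes out larger than MAE here: squaring weights the larger residual (1.0) more heavily, which is the key behavioral difference between the two metrics.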
One could ask why we use RMSE when MAE is less computationally expensive.
The link below beautifully explains why we do that. Do give it a read.