Skip to content

Commit

Permalink
Merge pull request #58 from phenoscape/balhoff-patch-1
Browse files Browse the repository at this point in the history
Remove matplotlib from regression.py
  • Loading branch information
balhoff authored Apr 17, 2020
2 parents 50fea5d + ef99d00 commit de645c0
Showing 1 changed file with 1 addition and 30 deletions.
31 changes: 1 addition & 30 deletions src/regression.py
Original file line number Diff line number Diff line change
Expand Up @@ -116,44 +116,15 @@ def reg_m(scores, sizes):
X = sm.add_constant(np.column_stack((ele, X)))
results = sm.OLS(scores, X).fit()
return results


def plot_residuals(corpus_profile_sizes, query_profile_sizes, scores, corpus_coeff, query_coeff, constant):
query_axis = []
corpus_axis = []
residuals = []
count = 0
mean = np.mean(scores)

for i in range(0, len(scores)):
query_size = query_profile_sizes[i]
corpus_size = corpus_profile_sizes[i]
actualscore = scores[i]
corpus_axis.append(corpus_size)
query_axis.append(query_size)
predictedscore = constant + (corpus_coeff * corpus_size) + (query_coeff * query_size)
residual = actualscore - predictedscore
residuals.append(residual)

plt.scatter(np.array(query_axis), np.array(residuals))
plt.xlabel('Log(Query Profile Size)')
plt.ylabel('Residual')
plt.savefig('ResidualPlot_QuerySizes.png')

plt.scatter(np.array(corpus_axis), np.array(residuals))
plt.xlabel('Log(Corpus Profile Size)')
plt.ylabel('Residual')
plt.savefig('ResidualPlot_CorpusSizes.png')


if __name__=='__main__':
import sys
import os
from statsmodels.stats.outliers_influence import OLSInfluence
import math
import matplotlib.pyplot as plt
import numpy as np
import statsmodels.api as sm
import statsmodels.stats.api as sms
from scipy import stats
main()
main()

0 comments on commit de645c0

Please sign in to comment.