Apress
diff --git a/‎week_12_1/P.1_josephus_problem_II.ipynb
Lines changed: 142 additions & 0 deletions b/‎week_12_1/P.1_josephus_problem_II.ipynb
Lines changed: 142 additions & 0 deletions
diff --git a/‎week_12_1/codon2amino.py
Lines changed: 39 additions & 0 deletions b/‎week_12_1/codon2amino.py
Lines changed: 39 additions & 0 deletions
diff --git a/‎week_12_1/creating_edge_list.py
Lines changed: 20 additions & 0 deletions b/‎week_12_1/creating_edge_list.py
Lines changed: 20 additions & 0 deletions
diff --git a/‎week_12_1/find_overlaps.py
Lines changed: 25 additions & 0 deletions b/‎week_12_1/find_overlaps.py
Lines changed: 25 additions & 0 deletions
diff --git a/‎week_12_1/hi_lo_partial
Lines changed: 45 additions & 0 deletions b/‎week_12_1/hi_lo_partial
Lines changed: 45 additions & 0 deletions
diff --git a/‎week_12_1/highest_in-degree_stations_edge_list.sh
Lines changed: 1 addition & 0 deletions b/‎week_12_1/highest_in-degree_stations_edge_list.sh
Lines changed: 1 addition & 0 deletions
diff --git a/‎week_12_1/highest_out-degree_stations_edge_list.sh
Lines changed: 1 addition & 0 deletions b/‎week_12_1/highest_out-degree_stations_edge_list.sh
Lines changed: 1 addition & 0 deletions
diff --git a/‎week_12_1/most_frequent_specimens_hewitsoni_males.sh
Lines changed: 1 addition & 0 deletions b/‎week_12_1/most_frequent_specimens_hewitsoni_males.sh
Lines changed: 1 addition & 0 deletions
diff --git a/‎week_12_1/most_frequent_stations_hewitsoni_males.sh
Lines changed: 1 addition & 0 deletions b/‎week_12_1/most_frequent_stations_hewitsoni_males.sh
Lines changed: 1 addition & 0 deletions
diff --git a/‎week_12_1/number_of_specimens_in_edge_list.sh
Lines changed: 4 additions & 0 deletions b/‎week_12_1/number_of_specimens_in_edge_list.sh
Lines changed: 4 additions & 0 deletions
@@ -0,0 +1,142 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Josephus Problem"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The Josephus Problem is a counting problem, named after a historical event described by Flavius Josephus.\n",
+    "In the original form, 41 objects are placed in a circle; starting from Object #1, every 3rd object is removed.\n",
+    "We want to preserve the order in which the objects are removed; more specifically, \n",
+    "we want to know which objects are the second-to-last and the last to be removed."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "list(range(1,42))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# pseudo-code\n",
+    "\n",
+    "# create three lists, one for circle_of_objects, one for removed_objects, and one for the skip\n",
+    "circle_of_objects, removed_objects, skip = range(1,42), [], range(3)\n",
+    "\n",
+    "# while circle_of_objects == True\n",
+    "while circle_of_objects:\n",
+    "\n",
+    "    # for i <- skip-list reversed\n",
+    "    for i in skip[::-1]:\n",
+    "\n",
+    "        # dequeue the next object\n",
+    "\n",
+    "        # the logical structure of the following\n",
+    "        # if-else clause is not pythonic.\n",
+    "        # in python, we prefer: if someCollection:\n",
+    "        # meaning \"True as long as someCollection\n",
+    "        # contains an item\"\n",
+    "        # let's refactor to clause.\n",
+    "        \n",
+    "        # if i == 0\n",
+    "\n",
+    "            # append next object to removed_objects list\n",
+    "            \n",
+    "        # else\n",
+    "        \n",
+    "            # append next object to circle_of_objects list\n",
+    "            \n",
+    "            \n",
+    "# print removed_objects list\n",
+    "removed_objects"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "for i in skip[::-1]:\n",
+    "    print(i)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "\n",
+       "        <iframe\n",
+       "            width=\"950\"\n",
+       "            height=\"800\"\n",
+       "            src=\"https://mathworld.wolfram.com/images/eps-gif/Josephus41-3_1000.gif\"\n",
+       "            frameborder=\"0\"\n",
+       "            allowfullscreen\n",
+       "        ></iframe>\n",
+       "        "
+      ],
+      "text/plain": [
+       "<IPython.lib.display.IFrame at 0x7f4f78309a90>"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from IPython.display import IFrame\n",
+    "IFrame('https://mathworld.wolfram.com/images/eps-gif/Josephus41-3_1000.gif', width=950, height=800)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from IPython.display import IFrame\n",
+    "IFrame('https://en.wikipedia.org/wiki/Josephus_problem', width=950, height=800)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
@@ -0,0 +1,39 @@
+import pickle
+import os
+def get_amino_acid(nuclStr: str, codon2amino: dict=None, path_to_pickled_dict: str=''):
+    ''' Translate a nucleotide string into amino acids for three reading frames.
+
+        Requires either codon2amino dict passed into function,
+        or path to pickled codon2amino dict file passed into it.
+        A non-empty codon2amino takes precedence over the pickled file.
+
+        Parameters:
+            nuclStr: nucleotide sequence; it is upper-cased before lookup
+                but not otherwise validated.
+            codon2amino: maps three-letter codon strings to amino-acid strings.
+            path_to_pickled_dict: path to a pickled codon2amino dict; only
+                read when codon2amino is missing or empty.
+
+        Returns tuple of amino-acid strings for three reading frames
+        (codons starting at offsets 0, 1 and 2 of nuclStr). A sequence
+        shorter than three characters yields three empty strings.
+
+        Raises:
+            AssertionError: neither a dict nor an existing pickle file was given.
+            Exception: a codon of nuclStr is not a key of codon2amino
+                (chained from the underlying KeyError).
+
+        With a complete codon table, 'GATTACAGATTACA' translates to
+        ('AspTyrArgLeu', 'IleThrAspTyr', 'LeuGlnIleThr').
+
+        >>> table = {'GAT': 'Asp', 'ATT': 'Ile', 'TTA': 'Leu'}
+        >>> get_amino_acid('gatta', table)
+        ('Asp', 'Ile', 'Leu')
+    '''
+    # garbage filters
+    # to do: garbage filter to ensure nuclStr is clean
+    if not codon2amino:
+        # raised explicitly (not via `assert`) so the check survives `python -O`;
+        # the exception type is kept for callers that already catch it
+        if not os.path.isfile(path_to_pickled_dict):
+            raise AssertionError(
+                "function must have dict passed into it, or dict must exist to pickle dir")
+        # SECURITY: unpickling can execute arbitrary code; only pass paths
+        # to pickle files that come from a trusted source
+        with open(path_to_pickled_dict, 'rb') as inFile:
+            codon2amino = pickle.load(inFile)
+    # implementation of algorithm
+    # assuming nuclStr is clean AND
+    # dict may be incomplete or have bad items
+    nuclStr = nuclStr.upper()
+    # one list of amino acids per reading frame; joined once at the end
+    frames = ([], [], [])
+
+    # slide a three-character window over the sequence; the window's start
+    # offset modulo 3 tells which reading frame the codon belongs to
+    for index in range(len(nuclStr) - 2):
+        codon = nuclStr[index:index+3]
+        try:
+            amino = codon2amino[codon]
+        except KeyError as e:
+            raise Exception(f"Codon {codon} not found in codon2amino dict.\n" \
+                  f"\tPlease check dictionary for item and codon used as key.") \
+                  from e
+        frames[index % 3].append(amino)
+    return tuple(''.join(frame) for frame in frames)
@@ -0,0 +1,20 @@
+# load the hewitsoni_males datafile into session memory as a
+# list of records, each record being a list of whitespace-split fields
+# NOTE(review): the companion gawk scripts read this file with -F"\t";
+# split() also breaks on spaces inside a field — confirm no field has any
+with open('datafile/hewitsoni_males.txt') as inFile:
+    LoS = inFile.read().splitlines()
+    LoL = [record.split() for record in LoS]
+
+# write the edge list: one line per pair of consecutive records whose
+# first fields match, holding that first field followed by the second
+# field of the earlier and of the later record, tab-separated
+with open('datafile/edge_list', 'w') as outFile:
+    # pairing the list with itself shifted by one stops at the
+    # second-to-last record, so nothing is read past the end
+    for current, following in zip(LoL, LoL[1:]):
+        if current[0] != following[0]:
+            continue
+        fields = (current[0], current[1], following[1])
+        outFile.write("\t".join(fields) + "\n")
+
@@ -0,0 +1,25 @@
+# Write every overlap between a test interval and an exon interval that
+# share the same first field to the file 'overlaps', one tab-separated
+# record per overlap: first field, overlap start, overlap end,
+# 4th field of the exon record, 4th field of the test record.
+# NOTE(review): fields are presumably chrom, start, end, name (BED-like) —
+# confirm; interval ends are treated as inclusive here (hence the +1).
+with open('datafile/finding_interval_overlaps/exon.bed', 'r') as exonFile,\
+     open('datafile/finding_interval_overlaps/test.sort.bed', 'r') as testFile:
+    # exon records are split on tabs only, test records on any whitespace
+    exonLoL = [exonRec.split('\t') for exonRec in exonFile.read().splitlines()]
+    testLoL = [testRec.split() for testRec in testFile.read().splitlines()]
+
+with open('overlaps', 'w') as outFile:
+    for testRec in testLoL:
+        # a test record without a 4th field (including a blank line)
+        # cannot be reported, so it is skipped up front
+        if len(testRec) <= 3:
+            continue
+        for exonRec in exonLoL:
+            if testRec[0] != exonRec[0]:
+                continue
+            # the range is empty (falsy) when the intervals do not overlap
+            overlap = range(max(int(testRec[1]), int(exonRec[1])),
+                            min(int(testRec[2]), int(exonRec[2]))+1)
+            if overlap:
+                record = (f"{exonRec[0]}\t{overlap[0]}\t"
+                          f"{overlap[-1]}\t{exonRec[3]}\t"
+                          f"{testRec[3]}\n")
+                outFile.write(record)
+        
+        
@@ -0,0 +1,45 @@
+#!/usr/bin/python3
+
+# we assume a fair player.
+
+import math
+
+# explain the game once, then keep asking until the user gives a usable
+# highest integer for the range; this initializes floor and ceiling
+print("in this game you give me a range of integers from 1 to some number you choose." + '\n' +
+"then you will pick a number within this range for me to guess." + '\n' +
+"i will try to guess your number in the fewest number of tries." + '\n' +
+"for each guess, you will tell me if your number is higher than (h)," + '\n' +
+"lower than (l), or equal to (=) my guess. ready?" + '\n')
+
+floor = 1
+while True:
+    ceiling = input("please enter the highest number of your range: ")
+
+    # int() raises ValueError on anything that is not an integer literal,
+    # so the conversion itself is part of the validation
+    try:
+        ceiling = int(ceiling)
+    except ValueError:
+        ceiling = None
+
+    # 'continue' returns to the top of the while loop to ask again;
+    # 'break' leaves the loop once the value is legitimate.
+    if ceiling is None or not ceiling > 1:
+        print("that's not a legitimate value. please enter a counting number greater than 1.")
+        continue
+    break
+
+# print the challenge of fewest guesses using this algorithm:
+# halving a range of `ceiling` numbers needs at most ceil(log2(ceiling + 1))
+# guesses (e.g. 7 numbers -> 3 guesses, 8 numbers -> 4 guesses)
+nguesses = math.ceil(math.log2(ceiling + 1))
+
+print(f"i can guess your number in at most {nguesses} guesses!\n")
+# initialize the guess counter
+guessCnt = 0
+# floor..ceiling always brackets the numbers still possible
+while floor <= ceiling:
+    guess = (floor + ceiling)//2
+
+    answer = input("i guess " + str(guess) + "! Is your number higher (h), lower (l), or equal (=)? ")
+    answer = answer.strip().lower()
+
+    # unrecognized input does not count as a guess; ask again
+    if answer not in ('h', 'l', '='):
+        print("please answer with h, l, or =.")
+        continue
+
+    guessCnt = guessCnt + 1
+    if answer == '=':
+        print(f"i guessed your number in {guessCnt} guess(es)!")
+        break
+    if answer == 'h':
+        # the number is above the guess: discard the lower half
+        floor = guess + 1
+    else:
+        # the number is below the guess: discard the upper half
+        ceiling = guess - 1
+else:
+    # only reached when the answers have ruled out every number
+    print("your answers rule out every number in the range.")
+
@@ -0,0 +1 @@
+# count each distinct value of tab-separated column 2 of the edge list and
+# show the ten highest counts, in ascending order
+# NOTE(review): if edges run from column 2 to column 3, column 2 holds the
+# source station (out-degree) rather than the in-degree — confirm
+gawk 'BEGIN { FS = "\t" } { print $2 }' datafile/edge_list | sort | uniq -c | sort -n | tail
@@ -0,0 +1 @@
+# count each distinct value of tab-separated column 3 of the edge list and
+# show the ten highest counts, in ascending order
+# NOTE(review): if edges run from column 2 to column 3, column 3 holds the
+# target station (in-degree) rather than the out-degree — confirm
+gawk 'BEGIN { FS = "\t" } { print $3 }' datafile/edge_list | sort | uniq -c | sort -n | tail
@@ -0,0 +1 @@
+# count how often each value of tab-separated column 1 occurs and show the
+# ten highest counts; sort first, because uniq -c only merges adjacent
+# identical lines and would otherwise split a value into several counts
+gawk -F"\t" '{print $1}' datafile/hewitsoni_males.txt | sort | uniq -c | sort -n | tail
@@ -0,0 +1 @@
+# count how often each value of tab-separated column 2 occurs and show the
+# ten highest counts; sort first, because uniq -c only merges adjacent
+# identical lines and would otherwise split a value into several counts
+gawk -F"\t" '{print $2}' datafile/hewitsoni_males.txt | sort | uniq -c | sort -n | tail
@@ -0,0 +1,4 @@
+# returns the number of distinct specimens that made it into edge list
+# NOTE(review): this script reads "$HOME"/datafile/edge_list while the sibling
+# scripts use the relative path datafile/edge_list — confirm which is intended
+gawk -F"\t" '{print $1}' "$HOME"/datafile/edge_list | # extract column 1
+sort -u | # keep one instance of each specimen, even if its records are not contiguous
+wc -l # return the number of specimens
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+gawk -F"\t" '{print $2}' datafile/edge_list \| sort \| uniq -c \| sort -n \| tail`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+gawk -F"\t" '{print $3}' datafile/edge_list \| sort \| uniq -c \| sort -n \| tail`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+gawk -F"\t" '{print $1}' datafile/hewitsoni_males.txt \| uniq -c \| sort -n \| tail`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+gawk -F"\t" '{print $2}' datafile/hewitsoni_males.txt \| uniq -c \| sort -n \| tail`