{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 55,
   "id": "6ee294dd-020e-417f-97a1-628ab8be56c6",
   "metadata": {},
   "outputs": [],
   "source": [
    "import rpy2\n",
    "import pdb,sys,os\n",
    "# NOTE(review): wildcard import; TabFile (used in the next cell) presumably comes from here - confirm and import it by name.\n",
    "from junlib.File import *\n",
    "import pandas as pd\n",
    "import pyreadr\n",
    "import numpy as np\n",
    "from junlib.BioUtils import BioList\n",
    "import scipy.io,scipy.sparse\n",
    "from scipy.sparse import csc_matrix"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "b65982ed-74e8-459f-9447-ca0e4022422c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the tab-delimited table; it is indexed below as a sequence of rows (header row first).\n",
    "ex=TabFile(\"treutlein2016_2\").read(\"\\t\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "bebed5d6-4e30-491f-a349-6ab51aff6c34",
   "metadata": {},
   "outputs": [],
   "source": [
    "# The leading N_META_COLS fields of each row hold cell metadata (named Cell/Time/Label below);\n",
    "# the header row supplies the gene names and the remaining fields form the matrix rows.\n",
    "N_META_COLS=3\n",
    "Genes=ex[0][N_META_COLS:]\n",
    "Cells=[row[:N_META_COLS] for row in ex[1:]]\n",
    "Matrix=[row[N_META_COLS:] for row in ex[1:]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "f63ab962-4b4d-414e-8915-1c03ee8f80b5",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['1_iN2_C02', '0', 'MEF']"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "Cells[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "9b193544-9221-4800-921f-1aed6b0c9afe",
   "metadata": {},
   "outputs": [],
   "source": [
    "# One row per cell, indexed by the cell id; the 'Cell' column repeats the index values.\n",
    "# NOTE(review): fields are kept as read (Time is the string '0' in Cells[0]); convert dtypes before numeric use.\n",
    "df_Cells=pd.DataFrame(\n",
    "    data=Cells,\n",
    "    columns=['Cell','Time','Label'],\n",
    "    index=[meta[0] for meta in Cells],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "f30e5236-dea6-45ec-9aec-c631e60aa7ea",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export the cell metadata table to an R .Rds file in the working directory.\n",
    "pyreadr.write_rds(\"Cells.Rds\", df_Cells)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "82957d3c-18f3-4cef-8d5b-98077904c60a",
   "metadata": {},
   "outputs": [],
   "source": [
    "# One row per gene; the gene name serves as both the index and the single 'Gene' column.\n",
    "df_Genes=pd.DataFrame(data=Genes,columns=['Gene'],index=Genes)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "982de120-b220-4cbd-96e0-0f764d7765ea",
   "metadata": {},
"outputs": [ { "data": { "text/plain": [ "11835" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "len(Matrix[0])" ] }, { "cell_type": "code", "execution_count": 9, "id": "bdef33fc-77b9-4d6e-848c-9263b582480d", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Gene | \n", "
---|---|
0610007C21Rik | \n", "0610007C21Rik | \n", "
0610007L01Rik | \n", "0610007L01Rik | \n", "
0610007N19Rik | \n", "0610007N19Rik | \n", "
0610007P08Rik | \n", "0610007P08Rik | \n", "
0610007P14Rik | \n", "0610007P14Rik | \n", "
... | \n", "... | \n", "
Zyx | \n", "Zyx | \n", "
Zzef1 | \n", "Zzef1 | \n", "
Zzz3 | \n", "Zzz3 | \n", "
l7Rn6 | \n", "l7Rn6 | \n", "
rtTA | \n", "rtTA | \n", "
11835 rows × 1 columns
\n", "\n", " | 1_iN2_C02 | \n", "1_iN2_C05 | \n", "1_iN2_C07 | \n", "1_iN2_C08 | \n", "1_iN2_C09 | \n", "1_iN2_C12 | \n", "1_iN2_C13 | \n", "1_iN2_C14 | \n", "1_iN2_C15 | \n", "1_iN2_C16 | \n", "... | \n", "1ggM_iN4_C76 | \n", "1ggM_iN4_C83 | \n", "1ggM_iN4_C85 | \n", "1ggS_iN4_C10 | \n", "1ggS_iN4_C13 | \n", "1ggS_iN4_C67 | \n", "1gL_iN4_C02 | \n", "1gL_iN4_C31 | \n", "1gL_iN4_C39 | \n", "1gM_iN4_C42 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0610007C21Rik | \n", "6.34167633593164 | \n", "4.95994469222165 | \n", "0 | \n", "4.69753105419149 | \n", "6.60915211004153 | \n", "6.74946434712868 | \n", "0 | \n", "4.89686059774015 | \n", "7.15097620794178 | \n", "3.27141502017117 | \n", "... | \n", "5.78129647062759 | \n", "5.97223032419806 | \n", "4.74779004418384 | \n", "6.48528414489047 | \n", "8.55296506786842 | \n", "2.41537525574661 | \n", "6.48903675234239 | \n", "7.40922896532355 | \n", "4.1287063120705 | \n", "6.61612668319865 | \n", "
0610007L01Rik | \n", "0 | \n", "6.23143166056305 | \n", "0 | \n", "3.06291193876294 | \n", "6.62797584725158 | \n", "0 | \n", "5.58661648740854 | \n", "1.31693501715475 | \n", "2.41201070412151 | \n", "4.70269246804867 | \n", "... | \n", "0.754359626243285 | \n", "0 | \n", "4.19029341650084 | \n", "0 | \n", "2.50004437918514 | \n", "6.72515587274112 | \n", "4.40442416645675 | \n", "5.10771074049084 | \n", "0 | \n", "0 | \n", "
0610007N19Rik | \n", "0 | \n", "0 | \n", "3.88899086305825 | \n", "0 | \n", "5.55986798002719 | \n", "0 | \n", "1.55608874897096 | \n", "1.48335577825169 | \n", "0 | \n", "3.55424048563973 | \n", "... | \n", "4.99616229084016 | \n", "0 | \n", "0 | \n", "3.85089831294737 | \n", "0 | \n", "0 | \n", "4.18427713031916 | \n", "4.00900586563456 | \n", "0 | \n", "4.2097714690844 | \n", "
0610007P08Rik | \n", "0 | \n", "0 | \n", "0.041368356292466 | \n", "0 | \n", "3.247370259674 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0.142924985049315 | \n", "0 | \n", "0 | \n", "0 | \n", "2.3112007267365 | \n", "0 | \n", "0 | \n", "5.13145556233943 | \n", "
0610007P14Rik | \n", "5.69038265654589 | \n", "6.05501872589075 | \n", "5.53021647396939 | \n", "0.693763883119321 | \n", "6.67374167221402 | \n", "6.19166034426733 | \n", "6.22603583215095 | \n", "7.23003191689867 | \n", "6.40741616227404 | \n", "7.31172597492533 | \n", "... | \n", "0 | \n", "4.15959656397144 | \n", "3.82158466918684 | \n", "0 | \n", "0 | \n", "0 | \n", "4.45912999274342 | \n", "3.43074049497696 | \n", "4.58087193717366 | \n", "7.49525945442237 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
Zyx | \n", "1.68217081808919 | \n", "5.83847642850374 | \n", "2.61446606655115 | \n", "7.46419567892784 | \n", "7.93359175129272 | \n", "3.94400039784829 | \n", "6.83236707003029 | \n", "3.80992399117742 | \n", "7.56368677291249 | \n", "4.35961428372074 | \n", "... | \n", "6.89643568617355 | \n", "4.53777172700827 | \n", "0 | \n", "4.62437602762411 | \n", "2.0189608276121 | \n", "0.539820437720234 | \n", "4.96591667762543 | \n", "7.19014075266198 | \n", "6.09971545157864 | \n", "6.06130415583606 | \n", "
Zzef1 | \n", "1.13929161597511 | \n", "0 | \n", "2.14584563945167 | \n", "3.40758812269554 | \n", "1.93392424186095 | \n", "0.738831625223013 | \n", "0 | \n", "0.641061008770318 | \n", "0 | \n", "2.3670933216363 | \n", "... | \n", "0 | \n", "0 | \n", "1.43660286051722 | \n", "1.26416417915575 | \n", "3.86510503648837 | \n", "0 | \n", "0.0192430133830156 | \n", "0 | \n", "0 | \n", "3.27570987739765 | \n", "
Zzz3 | \n", "0 | \n", "3.64217030902425 | \n", "3.86499003785313 | \n", "0 | \n", "0 | \n", "2.58483826411844 | \n", "3.12161144139684 | \n", "0.283545988272131 | \n", "2.26862930569997 | \n", "3.15643281728014 | \n", "... | \n", "2.31685707660686 | \n", "0 | \n", "0 | \n", "2.9157611264727 | \n", "4.59389572902205 | \n", "0 | \n", "0.975105751693184 | \n", "0 | \n", "1.62308812679231 | \n", "4.26004685209986 | \n", "
l7Rn6 | \n", "2.06522810329743 | \n", "5.09243041360646 | \n", "1.98971987695061 | \n", "3.99545134551551 | \n", "3.62795149221342 | \n", "6.55105953717305 | \n", "6.41611931130928 | \n", "6.11369119626157 | \n", "6.34813932675448 | \n", "6.12916286074585 | \n", "... | \n", "2.53671173242399 | \n", "4.98835913913751 | \n", "5.21666625158915 | \n", "0 | \n", "5.7821069729385 | \n", "0 | \n", "4.75277032441183 | \n", "5.68148201446647 | \n", "0 | \n", "4.54152040770032 | \n", "
rtTA | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "6.21058960912856 | \n", "7.61238696795978 | \n", "6.48015965083557 | \n", "5.40573243922186 | \n", "7.84870612349304 | \n", "5.95816207481279 | \n", "0 | \n", "0 | \n", "5.62104404452778 | \n", "0 | \n", "
11835 rows × 252 columns
\n", "