Discard reports without overrepresented sequences
This commit is contained in:
parent
e59683b925
commit
52eaee4568
|
@@ -14,8 +14,9 @@ def extract_adapters(files) -> Tuple[Series, List]:
|
|||
all_adapters = DataFrame()
|
||||
for entry in files:
|
||||
tables = read_html(entry)
|
||||
adapter_sequences = tables[1].Sequence
|
||||
all_adapters = all_adapters.append(adapter_sequences)
|
||||
if len(tables) > 1:
|
||||
adapter_sequences = tables[1].Sequence
|
||||
all_adapters = all_adapters.append(adapter_sequences)
|
||||
processed_adapters = preprocess_dataframe(all_adapters)
|
||||
stats = [
|
||||
processed_adapters.str.len().mean(),
|
||||
|
|
Loading…
Reference in New Issue