Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
C
courseML_phd2023
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Wiki
Requirements
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Locked files
Build
Pipelines
Jobs
Pipeline schedules
Test cases
Artifacts
Deploy
Releases
Package registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Code review analytics
Issue analytics
Insights
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
GitLab community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
GILSON Matthieu
courseML_phd2023
Commits
2ca73268
Commit
2ca73268
authored
2 years ago
by
GILSON Matthieu
Browse files
Options
Downloads
Patches
Plain Diff
Upload New File
parent
e9e9c186
Loading
Loading
No related merge requests found
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
data_time_series/test_classif_data.ipynb
+158
-0
158 additions, 0 deletions
data_time_series/test_classif_data.ipynb
with
158 additions
and
0 deletions
data_time_series/test_classif_data.ipynb
0 → 100644
+
158
−
0
View file @
2ca73268
{
"cells": [
{
"cell_type": "code",
"execution_count": 6,
"id": "349c8bc6-1a18-4fe2-869c-5581df684b1c",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"import numpy as np\n",
"import pandas as pd\n",
"\n",
"from sktime.datasets import load_from_arff_to_dataframe\n",
"\n",
"import matplotlib.pyplot as plt"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "47021efb-21dc-4ed2-8375-de1355344a16",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"#dataset = 'FordA'\n",
"dataset = 'Cricket'\n",
"#dataset = 'Phoneme'\n",
"\n",
"X_train, y_train = load_from_arff_to_dataframe('{0}/{0}_TRAIN.arff'.format(dataset))\n",
"X_test, y_test = load_from_arff_to_dataframe('{0}/{0}_TEST.arff'.format(dataset))"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "ea059511-2df8-447e-a064-ab23a2d4b6f5",
"metadata": {
"tags": []
},
"outputs": [
{
"data": {
"image/png": "",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"plt.figure()\n",
"plt.plot(X_train.iloc[0,0])\n",
"plt.xlabel('time')\n",
"plt.ylabel('a.u.')\n",
"plt.title('example trace')\n",
"\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "5f1297d0-e59b-46ef-bd1c-2c974b7b2fbd",
"metadata": {
"tags": []
},
"outputs": [],
"source": [
"X_mean_train = pd.DataFrame(columns=['mean'])\n",
"for i in range(X_train.shape[0]):\n",
" X_mean_train = pd.concat((X_mean_train, \n",
" pd.DataFrame({'mean': X_train.iloc[i,0].mean()}, index=[0])), ignore_index=True)\n",
" \n",
"X_mean_test = pd.DataFrame(columns=['mean'])\n",
"for i in range(X_test.shape[0]):\n",
" X_mean_test = pd.concat((X_mean_test, \n",
" pd.DataFrame({'mean': X_test.iloc[i,0].mean()}, index=[0])), ignore_index=True)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "656566da-5f08-414a-90d5-274ed35f0b73",
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"(108, 1) (108,)\n",
"['1.0' '10.0' '11.0' '12.0' '2.0' '3.0' '4.0' '5.0' '6.0' '7.0' '8.0'\n",
" '9.0']\n"
]
}
],
"source": [
"print(X_mean_train.shape, y_train.shape)\n",
"\n",
"print(np.unique(y_train))"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "ad8ea31a-e7af-45a7-b6f0-091b51d82db3",
"metadata": {
"tags": []
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"0.08333333333333333\n"
]
}
],
"source": [
"from sklearn.linear_model import LogisticRegression\n",
"\n",
"lr = LogisticRegression()\n",
"\n",
"lr.fit(X_mean_train, y_train)\n",
"\n",
"print(lr.score(X_mean_test, y_test))"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.10"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
%% Cell type:code id:349c8bc6-1a18-4fe2-869c-5581df684b1c tags:
```python
import
numpy
as
np
import
pandas
as
pd
from
sktime.datasets
import
load_from_arff_to_dataframe
import
matplotlib.pyplot
as
plt
```
%% Cell type:code id:47021efb-21dc-4ed2-8375-de1355344a16 tags:
```python
# Dataset to load; 'FordA' and 'Phoneme' are the alternatives that were
# listed (commented out) next to this choice.
dataset = 'Cricket'

# Both splits are read from <dataset>/<dataset>_<SPLIT>.arff, relative to the
# current working directory.
train_path = '{0}/{0}_TRAIN.arff'.format(dataset)
test_path = '{0}/{0}_TEST.arff'.format(dataset)

# Each call returns a (features, labels) pair.
X_train, y_train = load_from_arff_to_dataframe(train_path)
X_test, y_test = load_from_arff_to_dataframe(test_path)
```
%% Cell type:code id:ea059511-2df8-447e-a064-ab23a2d4b6f5 tags:
```python
# Plot a single example: row 0, column 0 of the training frame.
example_trace = X_train.iloc[0, 0]

fig, ax = plt.subplots()
ax.plot(example_trace)
ax.set(xlabel='time', ylabel='a.u.', title='example trace')

plt.show()
```
%% Output
%% Cell type:code id:5f1297d0-e59b-46ef-bd1c-2c974b7b2fbd tags:
```python
def _mean_feature(X):
    """Summarise each row of X by the mean of its column-0 entry.

    Parameters
    ----------
    X : pandas.DataFrame
        Frame whose column 0 holds, per row, an object exposing ``.mean()``
        (presumably one time series per cell -- confirm against the loader).

    Returns
    -------
    pandas.DataFrame
        One column named 'mean', one row per row of X, indexed 0..n-1.
    """
    # Build the whole column in one pass: growing a DataFrame with pd.concat
    # inside a loop copies all previous rows on every iteration, and seeding
    # it with an empty frame leaves the column with object dtype.
    return pd.DataFrame({'mean': [trace.mean() for trace in X.iloc[:, 0]]})


# Same feature extraction for both splits, so the classifier sees
# identically-built inputs at fit and score time.
X_mean_train = _mean_feature(X_train)
X_mean_test = _mean_feature(X_test)
```
%% Cell type:code id:656566da-5f08-414a-90d5-274ed35f0b73 tags:
```python
# Sanity check: the feature matrix and the label vector should have the same
# number of rows.
feature_shape = X_mean_train.shape
label_shape = y_train.shape
print(feature_shape, label_shape)

# List the distinct class labels present in the training split.
class_labels = np.unique(y_train)
print(class_labels)
```
%% Output
(108, 1) (108,)
['1.0' '10.0' '11.0' '12.0' '2.0' '3.0' '4.0' '5.0' '6.0' '7.0' '8.0'
'9.0']
%% Cell type:code id:ad8ea31a-e7af-45a7-b6f0-091b51d82db3 tags:
```python
from sklearn.linear_model import LogisticRegression

# Baseline classifier: default-parameter logistic regression trained on the
# single 'mean' feature. fit() returns the estimator, so it can be chained.
lr = LogisticRegression().fit(X_mean_train, y_train)

# Score on the held-out split and print it.
# NOTE(review): the recorded output for 'Cricket' is 0.0833..., i.e. 1/12,
# with 12 distinct labels in y_train -- the mean alone looks uninformative.
test_score = lr.score(X_mean_test, y_test)
print(test_score)
```
%% Output
0.08333333333333333
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment