Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Test ci #48

Closed
wants to merge 23 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
23 commits
Select commit Hold shift + click to select a range
ef8c48d
renamed a few test files.
brettwebst Apr 6, 2024
e4b1bfb
Merge pull request #2 from brettwebst/issue-32-add-dropna-test
brettwebst Apr 6, 2024
507e601
Merge branch 'SciSharp:master' into master
brettwebst Apr 6, 2024
c99194b
Merge branch 'SciSharp:master' into master
brettwebst Apr 6, 2024
8f7fd19
indexer tests
brettwebst Apr 14, 2024
f156da8
Merge pull request #3 from brettwebst/issue-32-add-index-test
brettwebst Apr 14, 2024
8f7890e
Merge branch 'SciSharp:master' into master
brettwebst Apr 27, 2024
4180a8c
subtraction
brettwebst Apr 27, 2024
671dc47
Subtract, divide, and equals
brettwebst Jul 14, 2024
47539a6
DataFrame operators - equality
brettwebst Jul 21, 2024
2b7a6cc
Merge pull request #4 from brettwebst/issue-32-operator-test-2
brettwebst Jul 21, 2024
a81e505
added pop test
brettwebst Jul 27, 2024
345a42c
Merge pull request #5 from brettwebst/issue-32-pop-test
brettwebst Jul 27, 2024
3550ff8
Sample test added.
brettwebst Jul 27, 2024
e5fd6fc
Merge pull request #6 from brettwebst/issue-32-sample
brettwebst Jul 27, 2024
2aca3ab
Create ubuntu-dotnet.yml
brettwebst Jul 27, 2024
fd2e0df
Merge pull request #7 from brettwebst/brettwebst-patch-1
brettwebst Jul 27, 2024
0b014a5
Update ubuntu-dotnet.yml
brettwebst Jul 27, 2024
5bc0a74
Remove reference to TensorFlow.NET
brettwebst Jul 27, 2024
5a4ab95
Update PandasConsole.indexers.cs
brettwebst Jul 27, 2024
239d97b
Merge pull request #9 from brettwebst/brettwebst-patch-1
brettwebst Jul 27, 2024
1068652
ubuntu, windows, and macos ci
brettwebst Jul 27, 2024
1bb1df4
fixing macos file 1
brettwebst Jul 27, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
33 changes: 33 additions & 0 deletions .github/workflows/macos-ci.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# This workflow will build a .NET project
# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-net

name: Build and Test
on:
push:
branches: [ "master" ]
pull_request:
branches: [ "master" ]

jobs:
build_matrix:
strategy:
matrix:
os:
- macos-latest

runs-on: ${{matrix.os}}

steps:
- uses: actions/checkout@v4
- name: Setup .NET
uses: actions/setup-dotnet@v4
with:
dotnet-version: 8.0.x
- name: Restore dependencies
run: dotnet restore
- name: SciSharp Mac OS Dependencies
run: Install-Package SciSharp.TensorFlow.Redist-OSX
- name: Build
run: dotnet build --no-restore
- name: Test
run: dotnet test --no-build --verbosity normal
32 changes: 32 additions & 0 deletions .github/workflows/ubuntu-windows-ci.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
# This workflow will build a .NET project
# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-net

name: Build and Test
on:
push:
branches: [ "master" ]
pull_request:
branches: [ "master" ]

jobs:
build_matrix:
strategy:
matrix:
os:
- ubuntu-latest
- windows-latest

runs-on: ${{matrix.os}}

steps:
- uses: actions/checkout@v4
- name: Setup .NET
uses: actions/setup-dotnet@v4
with:
dotnet-version: 8.0.x
- name: Restore dependencies
run: dotnet restore
- name: Build
run: dotnet build --no-restore
- name: Test
run: dotnet test --no-build --verbosity normal
26 changes: 26 additions & 0 deletions .vscode/launch.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
{
"version": "0.2.0",
"configurations": [
{
// Use IntelliSense to find out which attributes exist for C# debugging
// Use hover for the description of the existing attributes
// For further information visit https://github.com/dotnet/vscode-csharp/blob/main/debugger-launchjson.md
"name": ".NET Core Launch (console)",
"type": "coreclr",
"request": "launch",
"preLaunchTask": "build",
// If you have changed target frameworks, make sure to update the program path.
"program": "${workspaceFolder}/test/Pandas.NET.Test/bin/Debug/net8.0/Pandas.NET.Test.dll",
"args": [],
"cwd": "${workspaceFolder}/test/Pandas.NET.Test",
// For more information about the 'console' field, see https://aka.ms/VSCode-CS-LaunchJson-Console
"console": "internalConsole",
"stopAtEntry": false
},
{
"name": ".NET Core Attach",
"type": "coreclr",
"request": "attach"
}
]
}
41 changes: 41 additions & 0 deletions .vscode/tasks.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
{
"version": "2.0.0",
"tasks": [
{
"label": "build",
"command": "dotnet",
"type": "process",
"args": [
"build",
"${workspaceFolder}/Pandas.NET.sln",
"/property:GenerateFullPaths=true",
"/consoleloggerparameters:NoSummary;ForceNoAlign"
],
"problemMatcher": "$msCompile"
},
{
"label": "publish",
"command": "dotnet",
"type": "process",
"args": [
"publish",
"${workspaceFolder}/Pandas.NET.sln",
"/property:GenerateFullPaths=true",
"/consoleloggerparameters:NoSummary;ForceNoAlign"
],
"problemMatcher": "$msCompile"
},
{
"label": "watch",
"command": "dotnet",
"type": "process",
"args": [
"watch",
"run",
"--project",
"${workspaceFolder}/Pandas.NET.sln"
],
"problemMatcher": "$msCompile"
}
]
}
11 changes: 11 additions & 0 deletions src/Pandas.NET/Columns/Column.cs
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,17 @@ public class Column
public string Name { get; set; }
public Type DType { get; set; }


public Column()
{
}

public Column(string name, Type dtype)
{
Name = name;
DType = dtype;
}

public override string ToString()
=> $"{Name} {DType}";
}
Expand Down
6 changes: 6 additions & 0 deletions src/Pandas.NET/DataFrames/DataFrame.cs
Original file line number Diff line number Diff line change
Expand Up @@ -45,6 +45,12 @@ public DataFrame(List<Series> data, Series index = null, List<Column> columns =
index.size,
columns.Count
};

foreach (var s in _data)
{
s.SetIndex(_index);
}

}
}
}
27 changes: 27 additions & 0 deletions src/Pandas.NET/DataFrames/DataFrame.operator.cs
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,9 @@ public partial class DataFrame
{
data.Add(a.data[i] - b.data switch
{
double[] double64 => double64[i],
float[] float32 => float32[i],
int[] int32 => int32[i],
_ => throw new NotImplementedException("")
});
}
Expand All @@ -32,14 +34,26 @@ public partial class DataFrame
{
data.Add(a.data[i] / b.data switch
{
double[] double64 => double64[i],
float[] float32 => float32[i],
int[] int32 => int32[i],
_ => throw new NotImplementedException("")
});
}

return new DataFrame(data, index: a.index, columns: a.columns);
}

public static DataFrame operator *(DataFrame a, Series b)
{
var data = new List<Series>();
for(int i=0;i<a.data.Count; i++)
{
data.Add(a.data[i] * Convert.ToDouble(b.data.GetValue(i)));
}
return new DataFrame(data, index: a.index, columns: a.columns);
}

public static bool operator ==(DataFrame a, DataFrame b)
{
// do they have the same number of columns?
Expand Down Expand Up @@ -76,5 +90,18 @@ public partial class DataFrame
{
return !(a == b);
}

public override bool Equals(object obj)
{
return obj is DataFrame frame &&
data == frame.data &&
columns == frame.columns &&
index == frame.index;
}

public override int GetHashCode()
{
return HashCode.Combine(data, columns, index);
}
}
}
70 changes: 59 additions & 11 deletions src/Pandas.NET/DataFrames/DataFrame.sample.cs
Original file line number Diff line number Diff line change
@@ -1,28 +1,76 @@
using System;
using System.Collections;
using System.Collections.Generic;
using System.Linq;
using System.Reflection.PortableExecutable;
using Tensorflow.Util;

namespace PandasNet;

public partial class DataFrame
{
public DataFrame sample(float frac= 0.8f, int random_state = 0)
public DataFrame sample(int n = 0, float frac = 0, int random_state = 0, bool replace = false)
{
var rnd = new Random(random_state);
var n = (int)Math.Ceiling((1 - frac) * _index.size);
var excludeRowIndexArray = new int[n];
for (int i = 0; i < n; i++)
if (n == 0 && frac == 0)
{
throw new ArgumentException("Either n or frac should be greater than 0");
}
if (n != 0 && frac != 0)
{
throw new ArgumentException("Only one of n or frac should be greater than 0");
}
if (frac > 0)
{
excludeRowIndexArray[i] = rnd.Next(0, _index.size - 1);
n = (int)Math.Ceiling(frac * _index.size);
}
if (n > _index.size)
{
throw new ArgumentException("n should be less than the size of the DataFrame");
}

// treat axis as 0 for now. support for axis=1 should be added in the future
var rnd = new Random(random_state);

var data = new List<Series>();
// make a list that we can sample from
List<int> sampleIndex = null;

if(!replace){
// randomize the index and take the first n elements, no duplicates
sampleIndex = Enumerable
.Range(0, _index.size)
.OrderBy(arg => rnd.Next())
.Take(n).ToList();
}
else{
// for each sample, randomly select an index allowing duplicates
var sampleIndexes = Enumerable.Range(0, _index.size);
for (int i = 0; i < n; i++)
{
sampleIndex.Add(sampleIndexes.ElementAt(rnd.Next(0, sampleIndexes.Count()-1)));
}
}

// initialize a dictionary to hold the data
Dictionary<Column, ArrayList> data = new Dictionary<Column, ArrayList>();
foreach (var s in _data)
{
var series = s.drop(excludeRowIndexArray);
data.Add(series);
// init the array based on the dtype
ArrayList array =new ArrayList();
data.Add(s.column, array);
}

// fill the arrays with the sampled data
for (int i = 0; i < sampleIndex.Count; i++)
{
foreach (var s in _data)
{
data[s.column].Add(s.data.GetValue(sampleIndex[i]));
}
}
var index = _index.array<int>().Where(x => !excludeRowIndexArray.Contains(x)).ToArray();
return new DataFrame(data, columns: _columns, index: new Series(index));

// create a new DataFrame with the sampled data
DataFrame df = new DataFrame(data.Select(x => new Series(x.Value.ToArray(x.Key.DType), x.Key)).ToList(), index: new Series(sampleIndex.ToArray()));
return df;

}
}
1 change: 0 additions & 1 deletion src/Pandas.NET/Pandas.NET.csproj
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,5 @@
<PackageReference Include="MathNet.Numerics" Version="5.0.0" />
<PackageReference Include="SciSharp.TensorFlow.Redist" Version="2.16.0" />
<PackageReference Include="TensorFlow.Keras" Version="0.15.0" />
<PackageReference Include="TensorFlow.NET" Version="0.150.0" />
</ItemGroup>
</Project>
Loading
Loading