Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Audio PR - Augmentation support [ Non Silent Region Detection and Slice ] #1324

Merged
merged 193 commits into from
Jun 4, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
193 commits
Select commit Hold shift + click to select a range
83d5cbf
Bump rocm-docs-core[api_reference] from 0.34.0 to 0.34.2 in /docs/sph…
dependabot[bot] Feb 16, 2024
886684e
Bump cryptography from 42.0.0 to 42.0.2 in /docs/sphinx (#1289)
dependabot[bot] Feb 18, 2024
cf47a7f
Merge branch 'develop' of https://github.com/ROCm/MIVisionX into develop
Mar 13, 2024
f196208
Add PreEmphasis filter support
Mar 13, 2024
1e89c02
Fix ROI - change from xy to width & height
swetha097 Mar 13, 2024
d53f81d
Adding openvx changes for downmix node
SundarRajan28 Mar 13, 2024
9cef1ab
Audio Augmentations 1 PR - NSR and Spectrogram
swetha097 Mar 14, 2024
43dbde3
Revert "Adding openvx changes for downmix node"
swetha097 Mar 14, 2024
ba6ff14
Merging swbs_m2/audio/pr5 into swbs_m3/audio/pr6
swetha097 Mar 14, 2024
e94c53f
Fixing build issues
SundarRajan28 Mar 15, 2024
e63809c
Adding openvx extensions for to_decibels and normalize augmentations
SundarRajan28 Mar 15, 2024
589c823
Commenting out normalize kernel
SundarRajan28 Mar 18, 2024
7f77d64
Adding openvx extensions for resample and operator overloading nodes
SundarRajan28 Mar 18, 2024
b19a9ad
PR comments resolution in the PreEmphais Filter
swetha097 Mar 19, 2024
e92ffe4
Minor Changes
swetha097 Mar 20, 2024
b94144c
Change the borderType enum to int32 from uint32 dtype
swetha097 Mar 21, 2024
5808d6b
Fix validation of preemphasis
swetha097 Mar 21, 2024
33eb1ce
Remove the memcopy of the src and dest rois as it can be handled in t…
swetha097 Mar 21, 2024
8c4a98e
Formatting change - minor
swetha097 Mar 21, 2024
a58818e
Remove NSR
swetha097 Mar 22, 2024
e76b212
Merge branch 'swbs_m1/audio/pr3' into swbs_m2/audio/pr5
swetha097 Mar 22, 2024
c6dcd6b
Minor formatting changes
swetha097 Mar 22, 2024
4e3654a
Minor fix
swetha097 Mar 22, 2024
4495d5c
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 22, 2024
247cf70
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 22, 2024
e197789
Minor update - remove the 2nd instance of preemphasis filter
swetha097 Mar 22, 2024
1a51fee
Add openvx extensions for to_decibels augmentations
SundarRajan28 Mar 22, 2024
dba24ba
Enum dtype - change from uint to int
swetha097 Mar 22, 2024
6615b27
Remove roi_tensor_ptr_dst as its unused after latest changes
swetha097 Mar 22, 2024
84100bd
Remove the dst_roi arg from vxExtRppPreemphasisFilter call as its unused
swetha097 Mar 22, 2024
e8ff20e
Merge branch 'swbs_m1/audio/pr3' into swbs_m3/audio/pr6
SundarRajan28 Mar 25, 2024
dc4200b
Add MFB to MIVisisonX
swetha097 Mar 25, 2024
8c50b93
Revert "Add MFB to MIVisisonX"
swetha097 Mar 25, 2024
a649fba
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 25, 2024
01aba8a
Fixing issues with src ROI
SundarRajan28 Mar 25, 2024
0bc6e73
Merge branch 'swbs_m1/audio/pr3' into swbs_m2/audio/pr5
swetha097 Mar 25, 2024
854aa50
Resolve the PR comments
swetha097 Mar 25, 2024
a25b645
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 25, 2024
68a5d7e
Resolving review comments
SundarRajan28 Mar 25, 2024
ebe8933
Resolving review comments
SundarRajan28 Mar 25, 2024
886d6af
Change the dims[0] and dims[1] positioning for Spectrogram and AudioF…
swetha097 Mar 25, 2024
a446bff
Removing dstROI from to_decibels openvx augmentation
SundarRajan28 Mar 25, 2024
86aa2d3
Change function name to camelCase
swetha097 Mar 25, 2024
ce4778f
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 25, 2024
070bd82
Resolving review comments
SundarRajan28 Mar 25, 2024
704807f
Revert "Change the dims[0] and dims[1] positioning for Spectrogram an…
swetha097 Mar 26, 2024
658504f
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 26, 2024
7c47fdd
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 Mar 26, 2024
6919be6
Removing normalize node and adding formatting changes
SundarRajan28 Mar 26, 2024
e766dff
Fix Spectrogram
Mar 26, 2024
7f9e423
Merge branch 'swbs_m2/audio/pr5' of https://github.com/swetha097/MIVi…
Mar 26, 2024
a2c1063
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Mar 26, 2024
b2a6d58
NWC
swetha097 Mar 26, 2024
0a4f5b2
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 Mar 27, 2024
ff041d4
Adding resampling window calculation in openvx
SundarRajan28 Mar 29, 2024
a1a0d4d
NSR + SLice
swetha097 Mar 29, 2024
af230bd
Merge remote-tracking branch 'swe_fork/swbs_m5/audio/pr8' into swbs_m…
swetha097 Mar 29, 2024
32304a1
Updating resample node with latest changes
SundarRajan28 Mar 29, 2024
2977423
Resolving review comments
SundarRajan28 Apr 1, 2024
6844edf
Fixing ROI issues with TensorTensorAdd node
SundarRajan28 Apr 1, 2024
80568eb
Resolving review comments
SundarRajan28 Apr 1, 2024
4f43bf6
Fix Slice
swetha097 Apr 2, 2024
e0a8349
Remove commented code in Slice.cpp
swetha097 Apr 2, 2024
02e9f66
Modifying pSrcROI in Resample openvx
SundarRajan28 Apr 2, 2024
0fc8e2f
Merge remote-tracking branch 'swe_fork/swbs_m5/audio/pr8' into swbs_m…
swetha097 Apr 2, 2024
f33f679
Change the name NonSilentRegion to NonSilentRegionDetection
swetha097 Apr 2, 2024
cec154b
Remove the ND kernel layouts
swetha097 Apr 2, 2024
0fe6488
Adding comments for tensor tensor add openvx node
SundarRajan28 Apr 2, 2024
d0c09cc
Code clean up
swetha097 Apr 2, 2024
6f377a0
Resolve PR comments - 1
swetha097 Apr 2, 2024
76c90ee
Change ENUM from UINT to INT
swetha097 Apr 2, 2024
8f64b63
Minor change in the name of the desc ptr
swetha097 Apr 3, 2024
7f84251
Minor changes - resolve PR comments
swetha097 Apr 3, 2024
88d5048
Merge remote-tracking branch 'swe_fork/swbs_m5/audio/pr8' into swbs_m…
swetha097 Apr 3, 2024
1efbb5e
Minor changes to remove width usage
swetha097 Apr 3, 2024
9c01b0e
Resolve PR comments
swetha097 Apr 3, 2024
eb7ab70
Minor changes
swetha097 Apr 3, 2024
dd6eceb
Docs - update TOC for API Ref (#1327)
randyh62 Apr 9, 2024
724ebbf
Bump rocm-docs-core[api_reference] from 0.38.0 to 0.38.1 in /docs/sph…
dependabot[bot] Apr 11, 2024
a592da3
Update CHANGELOG.md
swetha097 Apr 11, 2024
d15cd67
Merge remote-tracking branch 'swe_fork/swbs_m1/audio/pr3' into swbs_m…
swetha097 Apr 11, 2024
3252e48
Update CHANGELOG.md
swetha097 Apr 11, 2024
f387e49
Documents - Bump idna from 3.4 to 3.7 in /docs/sphinx (#1330)
dependabot[bot] Apr 12, 2024
ebd1121
Fix slice layout issue
swetha097 Apr 15, 2024
b08b602
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Apr 16, 2024
3be53bf
Update changelog
SundarRajan28 Apr 16, 2024
cbcac89
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 Apr 16, 2024
e1d7f8e
Update changelog
SundarRajan28 Apr 16, 2024
a2b4867
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 Apr 16, 2024
d709bcb
Update changelog
SundarRajan28 Apr 16, 2024
3a09b7f
Merge remote-tracking branch 'upstream/develop' into swbs_m1/audio/pr3
SundarRajan28 Apr 17, 2024
ca43743
Merge branch 'swbs_m1/audio/pr3' into swbs_m2/audio/pr5
SundarRajan28 Apr 17, 2024
c69afd8
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Apr 17, 2024
b54cd21
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 Apr 17, 2024
990d92f
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 Apr 17, 2024
d0691b6
Update changelog
SundarRajan28 Apr 17, 2024
f46e48e
Merge branch 'swbs_m1/audio/pr3' into swbs_m2/audio/pr5
SundarRajan28 Apr 17, 2024
58d8c0d
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 Apr 17, 2024
e54a877
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 Apr 17, 2024
3053f86
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 Apr 17, 2024
80b55a5
Merge remote-tracking branch 'upstream/develop' into HEAD
swetha097 Apr 18, 2024
1e92a6c
Merge branch 'develop' into swbs_m1/audio/pr3
swetha097 Apr 18, 2024
83991ea
Resolve minor PR comments
swetha097 Apr 18, 2024
731d7a6
Merge branch 'swbs_m1/audio/pr3' into swbs_m2/audio/pr5
swetha097 Apr 18, 2024
5112ca8
Remove comments
swetha097 Apr 18, 2024
5532aae
Docs - Bump tqdm from 4.65.0 to 4.66.3 in /docs/sphinx (#1339)
dependabot[bot] May 3, 2024
bad8d31
Docs - Bump jinja2 from 3.1.3 to 3.1.4 in /docs/sphinx (#1340)
dependabot[bot] May 6, 2024
7ef3c3c
Find Half - Fix (#1341)
kiritigowda May 7, 2024
2358357
MIVisionX Setup - Updates (#1343)
kiritigowda May 8, 2024
7e8fbf5
Merge remote-tracking branch 'upstream/develop' into swbs_m2/audio/pr5
swetha097 May 8, 2024
4121a9c
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
swetha097 May 8, 2024
954eaa9
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
swetha097 May 8, 2024
3088822
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
swetha097 May 8, 2024
cab620b
SWDEV-459739 - Remove the package obsolete setting (#1345)
raramakr May 9, 2024
efdc885
Fix the layout issue with spec
swetha097 May 9, 2024
b4f93d1
Add layouts for Audio in vxTensorLayout
fiona-gladwin May 9, 2024
1d52b52
Merge branch 'swbs_m2/audio/pr5' of https://github.com/swetha097/MIVi…
fiona-gladwin May 9, 2024
212df74
Check the validity of pointers
swetha097 May 9, 2024
c0ce635
Validate the pointers for NSR and Slice
swetha097 May 9, 2024
fccd77d
Audio PR - Augmentation support [ Spectrogram ] (#1319)
swetha097 May 9, 2024
33a04d3
Introduce API to obtain RPP layout
fiona-gladwin May 9, 2024
d7db0cb
Merge remote-tracking branch 'upstream/develop' into swbs_m3/audio/pr6
SundarRajan28 May 10, 2024
99c7303
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 10, 2024
b1289ad
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 May 10, 2024
c396ead
Merge branch 'swbs_m2/audio/pr5' into swbs_m2/audio/pr5_layout
fiona-gladwin May 10, 2024
beba826
Add comments
fiona-gladwin May 10, 2024
5b75eed
Merge branch 'develop' of https://github.com/GPUOpen-ProfessionalComp…
fiona-gladwin May 10, 2024
81c5533
Resolving review comments
SundarRajan28 May 13, 2024
209b83a
Merge remote-tracking branch 'swbs_m2/audio/pr5_layout' into swbs_m3/…
SundarRajan28 May 13, 2024
b95c25a
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 13, 2024
2090e0b
Resolving review comments
SundarRajan28 May 13, 2024
e0883dd
Resolving review comments
SundarRajan28 May 14, 2024
1d1baeb
Resolving review comments
SundarRajan28 May 14, 2024
4b8ac7f
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 15, 2024
a849125
Minor changes
SundarRajan28 May 15, 2024
2502bc8
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 15, 2024
36fdc89
Removing if blocks for CPU device checks
SundarRajan28 May 15, 2024
99eeb10
Merge remote-tracking branch 'upstream/develop' into swbs_m3/audio/pr6
SundarRajan28 May 17, 2024
8bdad24
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 17, 2024
5036752
Merge remote-tracking branch 'origin/swbs_m5/audio/pr8' into swbs_m6/…
swetha097 May 17, 2024
ec5eb7c
Fix the build issue with merge of pr8 into pr9
swetha097 May 17, 2024
96bc055
Fix Slice kernel changes wrt recent merge
swetha097 May 17, 2024
06108e9
Minor change - remove NONE layout from MIVisionX
swetha097 May 17, 2024
9cf73d6
Merge branch 'swbs_m2/audio/pr5_layout' into swbs_m2/audio/pr5
fiona-gladwin May 17, 2024
b0f7289
Merge branch 'develop' of https://github.com/GPUOpen-ProfessionalComp…
fiona-gladwin May 20, 2024
2f33913
Use RPP_AUDIO flag to disable RPP audio calls
fiona-gladwin May 20, 2024
fefc759
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
fiona-gladwin May 20, 2024
ff3c50f
Add RPP_AUDIO flag for RPP audio API
fiona-gladwin May 20, 2024
cc9c1ce
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
fiona-gladwin May 20, 2024
1d0382c
Add RPP_AUDIO flag for RPP audio API
fiona-gladwin May 20, 2024
b3e53f5
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
fiona-gladwin May 20, 2024
a75d775
Add RPP_AUDIO flag for RPP audio API
fiona-gladwin May 20, 2024
540735f
Add RPP_AUDIO flag for slice
fiona-gladwin May 20, 2024
a525fce
Add Audio flag for PreEmphasis filter
fiona-gladwin May 20, 2024
7186b66
Revert "Add RPP_AUDIO flag for slice"
fiona-gladwin May 20, 2024
cfd5a7d
Minor changes
fiona-gladwin May 20, 2024
3f8d1c8
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
fiona-gladwin May 20, 2024
2613545
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
fiona-gladwin May 20, 2024
69ba07e
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
fiona-gladwin May 20, 2024
1897ec6
Minor fix
fiona-gladwin May 20, 2024
f1cb901
Merge remote-tracking branch 'upstream/develop' into swbs_m3/audio/pr6
SundarRajan28 May 22, 2024
fe22146
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 22, 2024
89237f3
Merge branch 'develop' into swbs_m2/audio/pr5
SundarRajan28 May 22, 2024
abe90cb
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 May 22, 2024
13989e7
Merge branch 'develop' into swbs_m2/audio/pr5
SundarRajan28 May 24, 2024
f601ad9
Merge branch 'develop' into swbs_m3/audio/pr6
SundarRajan28 May 24, 2024
26360e9
Merge branch 'develop' into swbs_m5/audio/pr8
SundarRajan28 May 24, 2024
9d4c979
Merge branch 'develop' into swbs_m6/audio/pr9
SundarRajan28 May 24, 2024
7ac933f
Merge branch 'develop' into swbs_m2/audio/pr5
LakshmiKumar23 May 28, 2024
b1c7694
Merge branch 'swbs_m2/audio/pr5' into swbs_m3/audio/pr6
SundarRajan28 May 29, 2024
9832085
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 29, 2024
bb7249d
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 May 29, 2024
f4dd4e3
Merge remote-tracking branch 'upstream/develop' into swbs_m3/audio/pr6
SundarRajan28 May 29, 2024
5bb4fd3
Merge branch 'swbs_m3/audio/pr6' into swbs_m5/audio/pr8
SundarRajan28 May 29, 2024
72fff96
Merge branch 'swbs_m5/audio/pr8' into swbs_m6/audio/pr9
SundarRajan28 May 29, 2024
cbf5fa9
Merge remote-tracking branch 'upstream/develop' into swbs_m6/audio/pr9
SundarRajan28 May 30, 2024
e8a9cc9
Merge remote-tracking branch 'upstream/develop' into swbs_m6/audio/pr9
SundarRajan28 May 30, 2024
338b7b8
Change map variable name
SundarRajan28 May 30, 2024
b0d90f6
Merge branch 'develop' into swbs_m6/audio/pr9
LakshmiKumar23 Jun 3, 2024
bb0dc29
Merge remote-tracking branch 'upstream/develop' into swbs_m6/audio/pr9
swetha097 Jun 3, 2024
428913d
Merge branch 'swbs_m6/audio/pr9' of https://github.com/swetha097/MIVi…
swetha097 Jun 3, 2024
c1434c8
Add audio flag for slice
fiona-gladwin Jun 3, 2024
ae2d74d
Merge branch 'swbs_m6/audio/pr9' of https://github.com/swetha097/MIVi…
fiona-gladwin Jun 3, 2024
72704fd
Remove the exit label
swetha097 Jun 3, 2024
7b2062d
Merge branch 'swbs_m6/audio/pr9' of https://github.com/swetha097/MIVi…
swetha097 Jun 3, 2024
d9e4045
Modify the redundant lines of fillGenericDescPtrFromDims
swetha097 Jun 3, 2024
3e666cb
Ad the label exit back
swetha097 Jun 3, 2024
99b30fb
Merge branch 'develop' of https://github.com/GPUOpen-ProfessionalComp…
fiona-gladwin Jun 3, 2024
6f811f3
Make the right Copyright change reverted in previous commit
swetha097 Jun 3, 2024
f12ca98
Merge branch 'swbs_m6/audio/pr9' of https://github.com/swetha097/MIVi…
swetha097 Jun 3, 2024
655463f
Add audio flag for slice
fiona-gladwin Jun 3, 2024
f32635a
Merge branch 'swbs_m6/audio/pr9' of https://github.com/swetha097/MIVi…
fiona-gladwin Jun 3, 2024
d7cefcd
Merge branch 'develop' into swbs_m6/audio/pr9
kiritigowda Jun 4, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@ Documentation for MIVisionX is available at
* Support for Spectrogram augmentation in openVX extensions
* Support for Downmix and ToDecibels augmentations in openVX extensions
* Support for Resample augmentation and Operator overloading nodes in openVX extensions
* Support for NonSilentRegionDetection and Slice augmentations in openVX extensions

### Optimizations

Expand Down
2 changes: 2 additions & 0 deletions amd_openvx_extensions/amd_rpp/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -146,6 +146,7 @@ list(APPEND SOURCES
source/tensor/Jitter.cpp
source/tensor/LensCorrection.cpp
source/tensor/Noise.cpp
source/tensor/NonSilentRegionDetection.cpp
source/tensor/Nop.cpp
source/tensor/Rotate.cpp
source/tensor/Pixelate.cpp
Expand All @@ -165,6 +166,7 @@ list(APPEND SOURCES
source/tensor/ToDecibels.cpp
source/tensor/Vignette.cpp
source/tensor/WarpAffine.cpp
source/tensor/Slice.cpp
source/kernel_rpp.cpp
source/internal_publishKernels.cpp
)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -162,6 +162,8 @@ vx_status ToDecibels_Register(vx_context);
vx_status Resample_Register(vx_context);
vx_status TensorMulScalar_Register(vx_context);
vx_status TensorAddTensor_Register(vx_context);
vx_status NonSilentRegionDetection_Register(vx_context);
vx_status Slice_Register(vx_context);

// kernel names
#define VX_KERNEL_RPP_NOPBATCHPD_NAME "org.rpp.NopbatchPD"
Expand Down Expand Up @@ -293,5 +295,7 @@ vx_status TensorAddTensor_Register(vx_context);
#define VX_KERNEL_RPP_RESAMPLE_NAME "org.rpp.Resample"
#define VX_KERNEL_RPP_TENSORMULSCALAR_NAME "org.rpp.TensorMulScalar"
#define VX_KERNEL_RPP_TENSORADDTENSOR_NAME "org.rpp.TensorAddTensor"
#define VX_KERNEL_RPP_NONSILENTREGIONDETECTION_NAME "org.rpp.NonSilentRegionDetection"
#define VX_KERNEL_RPP_SLICE_NAME "org.rpp.Slice"

#endif //_AMDVX_EXT__PUBLISH_KERNELS_H_
3 changes: 2 additions & 1 deletion amd_openvx_extensions/amd_rpp/include/internal_rpp.h
Original file line number Diff line number Diff line change
Expand Up @@ -92,7 +92,8 @@ vx_node createNode(vx_graph graph, vx_enum kernelEnum, vx_reference params[], vx
vx_status createRPPHandle(vx_node node, vxRppHandle ** pHandle, Rpp32u batchSize, Rpp32u deviceType);
vx_status releaseRPPHandle(vx_node node, vxRppHandle * handle, Rpp32u deviceType);
void fillDescriptionPtrfromDims(RpptDescPtr &descPtr, vxTensorLayout layout, size_t *tensorDims);
void fillAudioDescriptionPtrFromDims(RpptDescPtr &descPtr, size_t *tensorDims, vxTensorLayout layout = vxTensorLayout::VX_NHW);
void fillGenericDescriptionPtrfromDims(RpptGenericDescPtr &genericDescPtr, vxTensorLayout layout, size_t *maxTensorDims);
swetha097 marked this conversation as resolved.
Show resolved Hide resolved
void fillAudioDescriptionPtrFromDims(RpptDescPtr &descPtr, size_t *maxTensorDims, vxTensorLayout layout = vxTensorLayout::VX_NHW);
RpptDataType getRpptDataType(vx_enum dataType);

class Kernellist
Expand Down
4 changes: 3 additions & 1 deletion amd_openvx_extensions/amd_rpp/include/kernels_rpp.h
Original file line number Diff line number Diff line change
Expand Up @@ -154,7 +154,9 @@ extern "C"
VX_KERNEL_RPP_TODECIBELS = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x77,
VX_KERNEL_RPP_RESAMPLE = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x78,
VX_KERNEL_RPP_TENSORMULSCALAR = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x79,
VX_KERNEL_RPP_TENSORADDTENSOR = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x7a
VX_KERNEL_RPP_TENSORADDTENSOR = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x7a,
VX_KERNEL_RPP_NONSILENTREGIONDETECTION = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x7b,
VX_KERNEL_RPP_SLICE = VX_KERNEL_BASE(VX_ID_AMD, VX_LIBRARY_RPP) + 0x7c,
};

#ifdef __cplusplus
Expand Down
32 changes: 32 additions & 0 deletions amd_openvx_extensions/amd_rpp/include/vx_ext_rpp.h
Original file line number Diff line number Diff line change
Expand Up @@ -1957,6 +1957,38 @@ extern "C"
*/
SHARED_PUBLIC vx_node VX_API_CALL vxExtRppTensorAddTensor(vx_graph graph, vx_tensor pSrc1, vx_tensor pSrc2, vx_tensor pDst, vx_tensor pSrcRoi, vx_tensor pDstRoi);

/*! \brief [Graph] Performs leading and trailing silence detection on the input tensor.
* \ingroup group_amd_rpp
* \param [in] graph The handle to the graph.
* \param [in] pSrc The input tensor in <tt>\ref VX_TYPE_FLOAT32</tt> format data.
* \param [in] pSrcRoi The input tensor in <tt>unsigned int</tt> format containing the roi values for each input in the <begin_dim1, begin_dim2 .., length_dim1, length_dim2> format for each dimension.
* \param [out] pBegin The output tensor containing begin values of the non-silent region of the audio-data in <tt>\ref VX_TYPE_INT32</tt> format data.
* \param [out] pLength The output tensor containing length values of the non-silent region of the audio-data in <tt>\ref VX_TYPE_INT32</tt> format data.
* \param [in] cutOffDB The input scalar in <tt>\ref VX_TYPE_FLOAT32</tt> format containing the threshold, in dB, below which the signal is considered silent.
* \param [in] referencePower The input scalar in <tt>\ref VX_TYPE_FLOAT32</tt> format containing the reference power used for converting the signal to dB.
* \param [in] windowLength The input scalar in <tt>\ref VX_TYPE_INT32</tt> format containing the size of the sliding window.
* \param [in] resetInterval The input scalar in <tt>\ref VX_TYPE_INT32</tt> format containing the frequency at which the moving mean average is recalculated to mitigate precision loss.
* \return A node reference <tt>\ref vx_node</tt>. Any possible errors preventing a successful creation should be checked using <tt>\ref vxGetStatus</tt>.
*/
SHARED_PUBLIC vx_node VX_API_CALL vxExtRppNonSilentRegionDetection(vx_graph graph, vx_tensor pSrc, vx_tensor pSrcRoi, vx_tensor pBegin, vx_tensor pLength, vx_scalar cutOffDB, vx_scalar referencePower, vx_scalar windowLength, vx_scalar resetInterval);

/*! \brief [Graph] Slices the input tensor using anchor and shape values.
* \ingroup group_amd_rpp
* \param [in] graph The handle to the graph.
* \param [in] pSrc The input tensor in <tt>\ref VX_TYPE_UINT8</tt> or <tt>\ref VX_TYPE_FLOAT32</tt> format data.
* \param [in] pSrcRoi The input tensor in <tt>unsigned int</tt> format containing the roi values for the input tensor in the <begin_dim1, begin_dim2 .., length_dim1, length_dim2> format for each dimension.
* \param [out] pDst The output tensor in <tt>\ref VX_TYPE_UINT8</tt> or <tt>\ref VX_TYPE_FLOAT32</tt> format data.
* \param [in] pDstRoi The input tensor in <tt>unsigned int</tt> format containing the roi values for the output tensor in the <begin_dim1, begin_dim2 .., length_dim1, length_dim2> format for each dimension.
* \param [in] pAnchor The input tensor in <tt>\ref VX_TYPE_INT32</tt> format containing the absolute coordinates for the starting point of the slice.
* \param [in] pShape The input tensor in <tt>\ref VX_TYPE_INT32</tt> format containing the absolute coordinates for the dimensions of the slice.
* \param [in] pFillValue The input array in <tt>\ref VX_TYPE_INT32</tt> format which determines the values to be padded and is only relevant if policy is set to "pad".
* \param [in] policy The input scalar in <tt>\ref VX_TYPE_INT32</tt> format which determines the policy when slicing the out of bounds area of the input. The values can be "error", "pad", "trim_to_shape".
* \param [in] inputLayout The input scalar in <tt>\ref VX_TYPE_INT32</tt> format containing the layout of the input tensor.
* \param [in] roiType The input scalar in <tt>\ref VX_TYPE_INT32</tt> format containing the roi type which can be ltrb/xywh.
* \return A node reference <tt>\ref vx_node</tt>. Any possible errors preventing a successful creation should be checked using <tt>\ref vxGetStatus</tt>.
*/
SHARED_PUBLIC vx_node VX_API_CALL vxExtRppSlice(vx_graph graph, vx_tensor pSrc, vx_tensor pSrcRoi, vx_tensor pDst, vx_tensor pDstRoi, vx_tensor pAnchor, vx_tensor pShape, vx_array pFillValue, vx_scalar policy, vx_scalar inputLayout, vx_scalar roiType);

#ifdef __cplusplus
}
#endif
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,7 +167,8 @@ vx_status get_kernels_to_publish()
STATUS_ERROR_CHECK(ADD_KERNEL(Resample_Register));
STATUS_ERROR_CHECK(ADD_KERNEL(TensorMulScalar_Register));
STATUS_ERROR_CHECK(ADD_KERNEL(TensorAddTensor_Register));

STATUS_ERROR_CHECK(ADD_KERNEL(NonSilentRegionDetection_Register));
STATUS_ERROR_CHECK(ADD_KERNEL(Slice_Register));
return status;
}

Expand Down
64 changes: 64 additions & 0 deletions amd_openvx_extensions/amd_rpp/source/kernel_rpp.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2584,6 +2584,51 @@ VX_API_ENTRY vx_node VX_API_CALL vxExtRppSpectrogram(vx_graph graph, vx_tensor p
return node;
}

// Creates the NonSilentRegionDetection node in `graph`. The caller-supplied references
// are forwarded to createNode() in declaration order, followed by a VX_TYPE_UINT32
// scalar holding the value returned by getGraphAffinity(). Returns NULL when the
// graph's context does not report VX_SUCCESS.
VX_API_ENTRY vx_node VX_API_CALL vxExtRppNonSilentRegionDetection(vx_graph graph, vx_tensor pSrc, vx_tensor pSrcRoi, vx_tensor pBegin, vx_tensor pLength, vx_scalar cutOffDB, vx_scalar referencePower, vx_scalar windowLength, vx_scalar resetInterval) {
    vx_context context = vxGetContext((vx_reference)graph);
    if (vxGetStatus((vx_reference)context) != VX_SUCCESS)
        return NULL;

    vx_uint32 graphAffinity = getGraphAffinity(graph);
    vx_scalar affinityScalar = vxCreateScalar(vxGetContext((vx_reference)graph), VX_TYPE_UINT32, &graphAffinity);

    // Order matters: each slot index must match the kernel's parameter index.
    vx_reference nodeParams[] = {
        (vx_reference)pSrc,
        (vx_reference)pSrcRoi,
        (vx_reference)pBegin,
        (vx_reference)pLength,
        (vx_reference)cutOffDB,
        (vx_reference)referencePower,
        (vx_reference)windowLength,
        (vx_reference)resetInterval,
        (vx_reference)affinityScalar};
    const vx_uint32 paramCount = sizeof(nodeParams) / sizeof(nodeParams[0]);  // 9 entries
    return createNode(graph, VX_KERNEL_RPP_NONSILENTREGIONDETECTION, nodeParams, paramCount);
}

// Creates the Slice node in `graph`. The caller-supplied references are forwarded to
// createNode() in declaration order, followed by a VX_TYPE_UINT32 scalar holding the
// value returned by getGraphAffinity(). Returns NULL when the graph's context does
// not report VX_SUCCESS.
VX_API_ENTRY vx_node VX_API_CALL vxExtRppSlice(vx_graph graph, vx_tensor pSrc, vx_tensor pSrcRoi, vx_tensor pDst, vx_tensor pDstRoi, vx_tensor pAnchor, vx_tensor pShape,
                                               vx_array pFillValue, vx_scalar policy, vx_scalar inputLayout, vx_scalar roiType) {
    vx_context context = vxGetContext((vx_reference)graph);
    if (vxGetStatus((vx_reference)context) != VX_SUCCESS)
        return NULL;

    vx_uint32 graphAffinity = getGraphAffinity(graph);
    vx_scalar affinityScalar = vxCreateScalar(vxGetContext((vx_reference)graph), VX_TYPE_UINT32, &graphAffinity);

    // Order matters: each slot index must match the kernel's parameter index.
    vx_reference nodeParams[] = {
        (vx_reference)pSrc,
        (vx_reference)pSrcRoi,
        (vx_reference)pDst,
        (vx_reference)pDstRoi,
        (vx_reference)pAnchor,
        (vx_reference)pShape,
        (vx_reference)pFillValue,
        (vx_reference)policy,
        (vx_reference)inputLayout,
        (vx_reference)roiType,
        (vx_reference)affinityScalar};
    const vx_uint32 paramCount = sizeof(nodeParams) / sizeof(nodeParams[0]);  // 11 entries
    return createNode(graph, VX_KERNEL_RPP_SLICE, nodeParams, paramCount);
}

VX_API_ENTRY vx_node VX_API_CALL vxExtRppDownmix(vx_graph graph, vx_tensor pSrc, vx_tensor pDst, vx_tensor pSrcRoi) {
vx_node node = NULL;
vx_context context = vxGetContext((vx_reference)graph);
Expand Down Expand Up @@ -2762,6 +2807,25 @@ void fillAudioDescriptionPtrFromDims(RpptDescPtr &descPtr, size_t *maxTensorDims
}
}

swetha097 marked this conversation as resolved.
Show resolved Hide resolved
// Fills the layout, dims, numDims and strides of a generic descriptor from the first
// three entries of maxTensorDims.
//   genericDescPtr - descriptor to populate (written in place)
//   layout         - must be VX_NHW, VX_NFT or VX_NTF
//   maxTensorDims  - at least three readable entries are accessed
// Throws std::runtime_error for any other layout value.
void fillGenericDescriptionPtrfromDims(RpptGenericDescPtr &genericDescPtr, vxTensorLayout layout, size_t *maxTensorDims) {
    const bool layoutSupported = (layout == vxTensorLayout::VX_NHW) ||
                                 (layout == vxTensorLayout::VX_NFT) ||
                                 (layout == vxTensorLayout::VX_NTF);
    if (!layoutSupported)
        throw std::runtime_error("Invalid layout value in fillGenericDescriptionPtrfromDims, currently supports only NHW/NFT/NTF layouts");

    // The descriptor layout is left untouched when the mapping has no entry for `layout`.
    const auto mappedLayout = tensorLayoutMapping.find(layout);
    if (mappedLayout != tensorLayoutMapping.end())
        genericDescPtr->layout = mappedLayout->second;

    for (int axis = 0; axis < 3; axis++)
        genericDescPtr->dims[axis] = maxTensorDims[axis];
    genericDescPtr->dims[3] = 1;

    // A trailing dimension of 1 means the data is treated as two-dimensional.
    genericDescPtr->numDims = (genericDescPtr->dims[2] == 1) ? 2 : 3;

    genericDescPtr->strides[2] = genericDescPtr->dims[3];
    genericDescPtr->strides[1] = genericDescPtr->dims[2] * genericDescPtr->dims[3];
    genericDescPtr->strides[0] = genericDescPtr->dims[1] * genericDescPtr->dims[2] * genericDescPtr->dims[3];
}

// utility functions
vx_node createNode(vx_graph graph, vx_enum kernelEnum, vx_reference params[], vx_uint32 num)
{
Expand Down
Loading